diff --git "a/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" --- "a/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" +++ "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.1162, "train/learning_rate": 2.396080760095012e-06, "train/epoch": 18.5, "train/global_step": 16500, "_runtime": 100541, "_timestamp": 1647475083, "_step": 16510, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 5.0, 7.0, 13.0, 13.0, 14.0, 16.0, 24.0, 18.0, 27.0, 22.0, 32.0, 34.0, 39.0, 42.0, 38.0, 50.0, 41.0, 35.0, 45.0, 52.0, 49.0, 63.0, 53.0, 49.0, 31.0, 29.0, 28.0, 28.0, 19.0, 22.0, 11.0, 13.0, 7.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.658233642578125, -22.21038818359375, -21.762540817260742, -21.314695358276367, -20.86684799194336, -20.419002532958984, -19.971155166625977, -19.5233097076416, -19.075462341308594, -18.62761688232422, -18.17976951599121, -17.731924057006836, -17.284076690673828, -16.836231231689453, -16.388383865356445, -15.940537452697754, -15.492691040039062, -15.044844627380371, -14.59699821472168, -14.149151802062988, -13.701305389404297, -13.253458976745605, -12.805612564086914, -12.357766151428223, -11.909920692443848, -11.462074279785156, -11.014227867126465, -10.566381454467773, -10.118535041809082, -9.67068862915039, -9.2228422164917, -8.774995803833008, -8.3271484375, -7.879302024841309, -7.431455612182617, -6.983609199523926, -6.535762786865234, -6.087916374206543, -5.640069961547852, -5.19222354888916, -4.744378089904785, -4.296531677246094, -3.8486852645874023, -3.400838851928711, -2.9529924392700195, -2.5051462650299072, -2.057299852371216, -1.6094534397125244, -1.161606788635254, -0.7137603759765625, -0.26591402292251587, 0.18193233013153076, 0.6297787427902222, 1.077625036239624, 1.5254714488983154, 1.9733178615570068, 2.4211642742156982, 2.8690106868743896, 3.316857099533081, 3.7647032737731934, 4.212549686431885, 4.660396099090576, 5.108242511749268, 5.556088924407959, 6.00393533706665]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 12.0, 8.0, 7.0, 10.0, 10.0, 20.0, 22.0, 27.0, 22.0, 36.0, 28.0, 40.0, 23.0, 43.0, 36.0, 40.0, 39.0, 40.0, 48.0, 36.0, 49.0, 35.0, 33.0, 41.0, 34.0, 25.0, 38.0, 39.0, 23.0, 17.0, 28.0, 7.0, 15.0, 11.0, 10.0, 9.0, 12.0, 3.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.937238693237305, -10.542332649230957, -10.147427558898926, -9.752521514892578, -9.357616424560547, -8.9627103805542, -8.567804336547852, -8.17289924621582, -7.777993202209473, -7.383087635040283, -6.988182067871094, -6.593276023864746, -6.198370456695557, -5.803464889526367, -5.4085588455200195, -5.01365327835083, -4.618747711181641, -4.223842144012451, -3.8289363384246826, -3.434030532836914, -3.0391249656677246, -2.644219398498535, -2.2493135929107666, -1.854407787322998, -1.4595022201538086, -1.0645965337753296, -0.6696908473968506, -0.2747851610183716, 0.12012052536010742, 0.5150262117385864, 0.9099318981170654, 1.304837703704834, 1.699742317199707, 2.0946478843688965, 2.489553689956665, 2.8844594955444336, 3.279365062713623, 3.6742706298828125, 4.06917667388916, 4.46408224105835, 4.858987808227539, 5.2538933753967285, 5.648798942565918, 6.043704986572266, 6.438610553741455, 6.8335161209106445, 7.228422164916992, 7.623327732086182, 8.018233299255371, 8.413139343261719, 8.80804443359375, 9.202950477600098, 9.597856521606445, 9.992761611938477, 10.387667655944824, 10.782573699951172, 11.177478790283203, 11.57238483428955, 11.967289924621582, 12.36219596862793, 12.757101058959961, 13.152007102966309, 13.546913146972656, 13.941818237304688, 14.336724281311035]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 16.0, 27.0, 40.0, 75.0, 105.0, 241.0, 342.0, 591.0, 1024.0, 1733.0, 2988.0, 4942.0, 8143.0, 13582.0, 22324.0, 37715.0, 63581.0, 108695.0, 185973.0, 320843.0, 535980.0, 767567.0, 776799.0, 548884.0, 328997.0, 190928.0, 111553.0, 65327.0, 38960.0, 23011.0, 13550.0, 8066.0, 4879.0, 2877.0, 1628.0, 953.0, 583.0, 347.0, 172.0, 108.0, 65.0, 35.0, 16.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.03125, -26.212646484375, -25.39404296875, -24.575439453125, -23.7568359375, -22.938232421875, -22.11962890625, -21.301025390625, -20.482421875, -19.663818359375, -18.84521484375, -18.026611328125, -17.2080078125, -16.389404296875, -15.57080078125, -14.752197265625, -13.93359375, -13.114990234375, -12.29638671875, -11.477783203125, -10.6591796875, -9.840576171875, -9.02197265625, -8.203369140625, -7.384765625, -6.566162109375, -5.74755859375, -4.928955078125, -4.1103515625, -3.291748046875, -2.47314453125, -1.654541015625, -0.8359375, -0.017333984375, 0.80126953125, 1.619873046875, 2.4384765625, 3.257080078125, 4.07568359375, 4.894287109375, 5.712890625, 6.531494140625, 7.35009765625, 8.168701171875, 8.9873046875, 9.805908203125, 10.62451171875, 11.443115234375, 12.26171875, 13.080322265625, 13.89892578125, 14.717529296875, 15.5361328125, 16.354736328125, 17.17333984375, 17.991943359375, 18.810546875, 19.629150390625, 20.44775390625, 21.266357421875, 22.0849609375, 22.903564453125, 23.72216796875, 24.540771484375, 25.359375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 9.0, 5.0, 13.0, 13.0, 14.0, 25.0, 18.0, 20.0, 29.0, 26.0, 34.0, 26.0, 36.0, 31.0, 35.0, 55.0, 31.0, 37.0, 41.0, 42.0, 39.0, 41.0, 30.0, 38.0, 34.0, 32.0, 29.0, 32.0, 30.0, 29.0, 21.0, 27.0, 13.0, 11.0, 10.0, 8.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.9453125, -13.50341796875, -13.0615234375, -12.61962890625, -12.177734375, -11.73583984375, -11.2939453125, -10.85205078125, -10.41015625, -9.96826171875, -9.5263671875, -9.08447265625, -8.642578125, -8.20068359375, -7.7587890625, -7.31689453125, -6.875, -6.43310546875, -5.9912109375, -5.54931640625, -5.107421875, -4.66552734375, -4.2236328125, -3.78173828125, -3.33984375, -2.89794921875, -2.4560546875, -2.01416015625, -1.572265625, -1.13037109375, -0.6884765625, -0.24658203125, 0.1953125, 0.63720703125, 1.0791015625, 1.52099609375, 1.962890625, 2.40478515625, 2.8466796875, 3.28857421875, 3.73046875, 4.17236328125, 4.6142578125, 5.05615234375, 5.498046875, 5.93994140625, 6.3818359375, 6.82373046875, 7.265625, 7.70751953125, 8.1494140625, 8.59130859375, 9.033203125, 9.47509765625, 9.9169921875, 10.35888671875, 10.80078125, 11.24267578125, 11.6845703125, 12.12646484375, 12.568359375, 13.01025390625, 13.4521484375, 13.89404296875, 14.3359375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 18.0, 19.0, 34.0, 44.0, 62.0, 103.0, 178.0, 257.0, 453.0, 740.0, 1197.0, 1903.0, 3084.0, 5115.0, 8553.0, 13968.0, 23589.0, 39481.0, 65885.0, 110372.0, 183649.0, 295675.0, 451137.0, 617613.0, 685910.0, 585661.0, 417225.0, 268178.0, 165987.0, 99795.0, 59373.0, 35570.0, 21445.0, 12669.0, 7592.0, 4454.0, 2816.0, 1727.0, 1038.0, 632.0, 412.0, 227.0, 171.0, 91.0, 66.0, 40.0, 21.0, 24.0, 10.0, 8.0, 7.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-20.390625, -19.76123046875, -19.1318359375, -18.50244140625, -17.873046875, -17.24365234375, -16.6142578125, -15.98486328125, -15.35546875, -14.72607421875, -14.0966796875, -13.46728515625, -12.837890625, -12.20849609375, -11.5791015625, -10.94970703125, -10.3203125, -9.69091796875, -9.0615234375, -8.43212890625, -7.802734375, -7.17333984375, -6.5439453125, -5.91455078125, -5.28515625, -4.65576171875, -4.0263671875, -3.39697265625, -2.767578125, -2.13818359375, -1.5087890625, -0.87939453125, -0.25, 0.37939453125, 1.0087890625, 1.63818359375, 2.267578125, 2.89697265625, 3.5263671875, 4.15576171875, 4.78515625, 5.41455078125, 6.0439453125, 6.67333984375, 7.302734375, 7.93212890625, 8.5615234375, 9.19091796875, 9.8203125, 10.44970703125, 11.0791015625, 11.70849609375, 12.337890625, 12.96728515625, 13.5966796875, 14.22607421875, 14.85546875, 15.48486328125, 16.1142578125, 16.74365234375, 17.373046875, 18.00244140625, 18.6318359375, 19.26123046875, 19.890625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 6.0, 2.0, 10.0, 13.0, 16.0, 17.0, 24.0, 33.0, 37.0, 55.0, 60.0, 68.0, 77.0, 102.0, 92.0, 135.0, 159.0, 152.0, 156.0, 184.0, 223.0, 237.0, 213.0, 245.0, 223.0, 227.0, 198.0, 161.0, 126.0, 119.0, 121.0, 90.0, 72.0, 75.0, 74.0, 53.0, 49.0, 44.0, 26.0, 20.0, 16.0, 16.0, 13.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.68359375, -7.44696044921875, -7.2103271484375, -6.97369384765625, -6.737060546875, -6.50042724609375, -6.2637939453125, -6.02716064453125, -5.79052734375, -5.55389404296875, -5.3172607421875, -5.08062744140625, -4.843994140625, -4.60736083984375, -4.3707275390625, -4.13409423828125, -3.8974609375, -3.66082763671875, -3.4241943359375, -3.18756103515625, -2.950927734375, -2.71429443359375, -2.4776611328125, -2.24102783203125, -2.00439453125, -1.76776123046875, -1.5311279296875, -1.29449462890625, -1.057861328125, -0.82122802734375, -0.5845947265625, -0.34796142578125, -0.111328125, 0.12530517578125, 0.3619384765625, 0.59857177734375, 0.835205078125, 1.07183837890625, 1.3084716796875, 1.54510498046875, 1.78173828125, 2.01837158203125, 2.2550048828125, 2.49163818359375, 2.728271484375, 2.96490478515625, 3.2015380859375, 3.43817138671875, 3.6748046875, 3.91143798828125, 4.1480712890625, 4.38470458984375, 4.621337890625, 4.85797119140625, 5.0946044921875, 5.33123779296875, 5.56787109375, 5.80450439453125, 6.0411376953125, 6.27777099609375, 6.514404296875, 6.75103759765625, 6.9876708984375, 7.22430419921875, 7.4609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 3.0, 11.0, 16.0, 10.0, 17.0, 14.0, 11.0, 17.0, 22.0, 33.0, 24.0, 40.0, 42.0, 52.0, 48.0, 45.0, 48.0, 56.0, 48.0, 58.0, 40.0, 54.0, 42.0, 32.0, 38.0, 30.0, 23.0, 24.0, 18.0, 13.0, 11.0, 13.0, 15.0, 2.0, 10.0, 6.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-21.853532791137695, -21.262256622314453, -20.67098045349121, -20.07970428466797, -19.488426208496094, -18.89715003967285, -18.30587387084961, -17.714597702026367, -17.123321533203125, -16.532045364379883, -15.94076919555664, -15.349492073059082, -14.75821590423584, -14.166939735412598, -13.575662612915039, -12.984386444091797, -12.393110275268555, -11.801834106445312, -11.21055793762207, -10.619280815124512, -10.02800464630127, -9.436728477478027, -8.845451354980469, -8.254175186157227, -7.662899017333984, -7.071622848510742, -6.480346202850342, -5.889069557189941, -5.297793388366699, -4.706517219543457, -4.115240573883057, -3.5239639282226562, -2.9326858520507812, -2.34140944480896, -1.7501330375671387, -1.1588566303253174, -0.5675802230834961, 0.023696184158325195, 0.6149725914001465, 1.2062492370605469, 1.797525405883789, 2.3888018131256104, 2.9800782203674316, 3.571354627609253, 4.162631034851074, 4.753907203674316, 5.345183849334717, 5.936460494995117, 6.527736663818359, 7.119012832641602, 7.710289478302002, 8.301566123962402, 8.892842292785645, 9.484118461608887, 10.075395584106445, 10.666671752929688, 11.25794792175293, 11.849224090576172, 12.440500259399414, 13.031777381896973, 13.623053550720215, 14.214329719543457, 14.805606842041016, 15.396883010864258, 15.9881591796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 7.0, 6.0, 4.0, 9.0, 16.0, 15.0, 22.0, 22.0, 22.0, 29.0, 34.0, 34.0, 41.0, 39.0, 39.0, 68.0, 43.0, 45.0, 40.0, 36.0, 43.0, 50.0, 42.0, 24.0, 45.0, 40.0, 36.0, 25.0, 26.0, 25.0, 22.0, 18.0, 12.0, 7.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.031862258911133, -19.448139190673828, -18.864416122436523, -18.28069305419922, -17.696971893310547, -17.113248825073242, -16.529525756835938, -15.945802688598633, -15.362079620361328, -14.778356552124023, -14.194633483886719, -13.61091136932373, -13.027188301086426, -12.443465232849121, -11.859743118286133, -11.276020050048828, -10.692296981811523, -10.108573913574219, -9.524850845336914, -8.941128730773926, -8.357405662536621, -7.773682594299316, -7.18996000289917, -6.606237411499023, -6.022514343261719, -5.438791275024414, -4.855068683624268, -4.271346092224121, -3.6876230239868164, -3.103900194168091, -2.5201773643493652, -1.9364547729492188, -1.352731704711914, -0.7690088748931885, -0.1852860450744629, 0.3984367847442627, 0.9821596145629883, 1.5658824443817139, 2.1496052742004395, 2.733327865600586, 3.3170509338378906, 3.900773763656616, 4.484496593475342, 5.068219184875488, 5.651942253112793, 6.235665321350098, 6.819387912750244, 7.403110504150391, 7.986833572387695, 8.570556640625, 9.154279708862305, 9.738001823425293, 10.321724891662598, 10.905447959899902, 11.48917007446289, 12.072893142700195, 12.6566162109375, 13.240339279174805, 13.82406234741211, 14.407784461975098, 14.991507530212402, 15.575230598449707, 16.158952713012695, 16.74267578125, 17.326398849487305]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 15.0, 22.0, 26.0, 45.0, 48.0, 90.0, 141.0, 209.0, 347.0, 511.0, 838.0, 1243.0, 1891.0, 2847.0, 4529.0, 7163.0, 11241.0, 18091.0, 29620.0, 48936.0, 81046.0, 127757.0, 172123.0, 176952.0, 136577.0, 87651.0, 53496.0, 32030.0, 19619.0, 12188.0, 7591.0, 4799.0, 3084.0, 2051.0, 1308.0, 812.0, 553.0, 368.0, 234.0, 155.0, 99.0, 66.0, 52.0, 30.0, 21.0, 10.0, 8.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.59375, -8.3172607421875, -8.040771484375, -7.7642822265625, -7.48779296875, -7.2113037109375, -6.934814453125, -6.6583251953125, -6.3818359375, -6.1053466796875, -5.828857421875, -5.5523681640625, -5.27587890625, -4.9993896484375, -4.722900390625, -4.4464111328125, -4.169921875, -3.8934326171875, -3.616943359375, -3.3404541015625, -3.06396484375, -2.7874755859375, -2.510986328125, -2.2344970703125, -1.9580078125, -1.6815185546875, -1.405029296875, -1.1285400390625, -0.85205078125, -0.5755615234375, -0.299072265625, -0.0225830078125, 0.25390625, 0.5303955078125, 0.806884765625, 1.0833740234375, 1.35986328125, 1.6363525390625, 1.912841796875, 2.1893310546875, 2.4658203125, 2.7423095703125, 3.018798828125, 3.2952880859375, 3.57177734375, 3.8482666015625, 4.124755859375, 4.4012451171875, 4.677734375, 4.9542236328125, 5.230712890625, 5.5072021484375, 5.78369140625, 6.0601806640625, 6.336669921875, 6.6131591796875, 6.8896484375, 7.1661376953125, 7.442626953125, 7.7191162109375, 7.99560546875, 8.2720947265625, 8.548583984375, 8.8250732421875, 9.1015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 8.0, 10.0, 16.0, 17.0, 18.0, 22.0, 22.0, 34.0, 32.0, 32.0, 44.0, 41.0, 41.0, 55.0, 54.0, 42.0, 38.0, 40.0, 44.0, 48.0, 39.0, 33.0, 38.0, 45.0, 29.0, 29.0, 28.0, 15.0, 27.0, 18.0, 11.0, 6.0, 9.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.078125, -20.46337890625, -19.8486328125, -19.23388671875, -18.619140625, -18.00439453125, -17.3896484375, -16.77490234375, -16.16015625, -15.54541015625, -14.9306640625, -14.31591796875, -13.701171875, -13.08642578125, -12.4716796875, -11.85693359375, -11.2421875, -10.62744140625, -10.0126953125, -9.39794921875, -8.783203125, -8.16845703125, -7.5537109375, -6.93896484375, -6.32421875, -5.70947265625, -5.0947265625, -4.47998046875, -3.865234375, -3.25048828125, -2.6357421875, -2.02099609375, -1.40625, -0.79150390625, -0.1767578125, 0.43798828125, 1.052734375, 1.66748046875, 2.2822265625, 2.89697265625, 3.51171875, 4.12646484375, 4.7412109375, 5.35595703125, 5.970703125, 6.58544921875, 7.2001953125, 7.81494140625, 8.4296875, 9.04443359375, 9.6591796875, 10.27392578125, 10.888671875, 11.50341796875, 12.1181640625, 12.73291015625, 13.34765625, 13.96240234375, 14.5771484375, 15.19189453125, 15.806640625, 16.42138671875, 17.0361328125, 17.65087890625, 18.265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 10.0, 13.0, 18.0, 17.0, 17.0, 30.0, 41.0, 86.0, 117.0, 182.0, 281.0, 408.0, 581.0, 1013.0, 1684.0, 2686.0, 4575.0, 7883.0, 15408.0, 34345.0, 772232.0, 152409.0, 25802.0, 12240.0, 6522.0, 3807.0, 2179.0, 1470.0, 835.0, 571.0, 344.0, 230.0, 161.0, 110.0, 72.0, 46.0, 37.0, 24.0, 15.0, 15.0, 9.0, 1.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.234375, -19.598876953125, -18.96337890625, -18.327880859375, -17.6923828125, -17.056884765625, -16.42138671875, -15.785888671875, -15.150390625, -14.514892578125, -13.87939453125, -13.243896484375, -12.6083984375, -11.972900390625, -11.33740234375, -10.701904296875, -10.06640625, -9.430908203125, -8.79541015625, -8.159912109375, -7.5244140625, -6.888916015625, -6.25341796875, -5.617919921875, -4.982421875, -4.346923828125, -3.71142578125, -3.075927734375, -2.4404296875, -1.804931640625, -1.16943359375, -0.533935546875, 0.1015625, 0.737060546875, 1.37255859375, 2.008056640625, 2.6435546875, 3.279052734375, 3.91455078125, 4.550048828125, 5.185546875, 5.821044921875, 6.45654296875, 7.092041015625, 7.7275390625, 8.363037109375, 8.99853515625, 9.634033203125, 10.26953125, 10.905029296875, 11.54052734375, 12.176025390625, 12.8115234375, 13.447021484375, 14.08251953125, 14.718017578125, 15.353515625, 15.989013671875, 16.62451171875, 17.260009765625, 17.8955078125, 18.531005859375, 19.16650390625, 19.802001953125, 20.4375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 11.0, 8.0, 8.0, 11.0, 15.0, 25.0, 19.0, 25.0, 20.0, 33.0, 36.0, 23.0, 31.0, 35.0, 39.0, 44.0, 39.0, 47.0, 51.0, 45.0, 28.0, 39.0, 38.0, 45.0, 33.0, 42.0, 24.0, 32.0, 20.0, 22.0, 17.0, 15.0, 10.0, 12.0, 9.0, 5.0, 10.0, 4.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.047607421875, -9.69677734375, -9.345947265625, -8.9951171875, -8.644287109375, -8.29345703125, -7.942626953125, -7.591796875, -7.240966796875, -6.89013671875, -6.539306640625, -6.1884765625, -5.837646484375, -5.48681640625, -5.135986328125, -4.78515625, -4.434326171875, -4.08349609375, -3.732666015625, -3.3818359375, -3.031005859375, -2.68017578125, -2.329345703125, -1.978515625, -1.627685546875, -1.27685546875, -0.926025390625, -0.5751953125, -0.224365234375, 0.12646484375, 0.477294921875, 0.828125, 1.178955078125, 1.52978515625, 1.880615234375, 2.2314453125, 2.582275390625, 2.93310546875, 3.283935546875, 3.634765625, 3.985595703125, 4.33642578125, 4.687255859375, 5.0380859375, 5.388916015625, 5.73974609375, 6.090576171875, 6.44140625, 6.792236328125, 7.14306640625, 7.493896484375, 7.8447265625, 8.195556640625, 8.54638671875, 8.897216796875, 9.248046875, 9.598876953125, 9.94970703125, 10.300537109375, 10.6513671875, 11.002197265625, 11.35302734375, 11.703857421875, 12.0546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 6.0, 6.0, 9.0, 13.0, 7.0, 15.0, 21.0, 21.0, 43.0, 63.0, 82.0, 109.0, 148.0, 255.0, 470.0, 881.0, 1911.0, 4782.0, 15182.0, 113771.0, 877510.0, 21996.0, 6358.0, 2371.0, 1062.0, 547.0, 291.0, 194.0, 144.0, 77.0, 52.0, 44.0, 27.0, 21.0, 19.0, 17.0, 9.0, 3.0, 6.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.478515625, -2.401397705078125, -2.32427978515625, -2.247161865234375, -2.1700439453125, -2.092926025390625, -2.01580810546875, -1.938690185546875, -1.861572265625, -1.784454345703125, -1.70733642578125, -1.630218505859375, -1.5531005859375, -1.475982666015625, -1.39886474609375, -1.321746826171875, -1.24462890625, -1.167510986328125, -1.09039306640625, -1.013275146484375, -0.9361572265625, -0.859039306640625, -0.78192138671875, -0.704803466796875, -0.627685546875, -0.550567626953125, -0.47344970703125, -0.396331787109375, -0.3192138671875, -0.242095947265625, -0.16497802734375, -0.087860107421875, -0.0107421875, 0.066375732421875, 0.14349365234375, 0.220611572265625, 0.2977294921875, 0.374847412109375, 0.45196533203125, 0.529083251953125, 0.606201171875, 0.683319091796875, 0.76043701171875, 0.837554931640625, 0.9146728515625, 0.991790771484375, 1.06890869140625, 1.146026611328125, 1.22314453125, 1.300262451171875, 1.37738037109375, 1.454498291015625, 1.5316162109375, 1.608734130859375, 1.68585205078125, 1.762969970703125, 1.840087890625, 1.917205810546875, 1.99432373046875, 2.071441650390625, 2.1485595703125, 2.225677490234375, 2.30279541015625, 2.379913330078125, 2.45703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 15.0, 12.0, 12.0, 22.0, 34.0, 28.0, 43.0, 43.0, 63.0, 71.0, 78.0, 89.0, 69.0, 78.0, 74.0, 47.0, 41.0, 32.0, 25.0, 18.0, 20.0, 13.0, 6.0, 13.0, 7.0, 6.0, 5.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00010019540786743164, -9.726919233798981e-05, -9.434297680854797e-05, -9.141676127910614e-05, -8.84905457496643e-05, -8.556433022022247e-05, -8.263811469078064e-05, -7.97118991613388e-05, -7.678568363189697e-05, -7.385946810245514e-05, -7.09332525730133e-05, -6.800703704357147e-05, -6.508082151412964e-05, -6.21546059846878e-05, -5.922839045524597e-05, -5.630217492580414e-05, -5.3375959396362305e-05, -5.044974386692047e-05, -4.752352833747864e-05, -4.4597312808036804e-05, -4.167109727859497e-05, -3.874488174915314e-05, -3.5818666219711304e-05, -3.289245069026947e-05, -2.9966235160827637e-05, -2.7040019631385803e-05, -2.411380410194397e-05, -2.1187588572502136e-05, -1.8261373043060303e-05, -1.533515751361847e-05, -1.2408941984176636e-05, -9.482726454734802e-06, -6.556510925292969e-06, -3.6302953958511353e-06, -7.040798664093018e-07, 2.2221356630325317e-06, 5.148351192474365e-06, 8.074566721916199e-06, 1.1000782251358032e-05, 1.3926997780799866e-05, 1.68532133102417e-05, 1.9779428839683533e-05, 2.2705644369125366e-05, 2.56318598985672e-05, 2.8558075428009033e-05, 3.148429095745087e-05, 3.44105064868927e-05, 3.7336722016334534e-05, 4.026293754577637e-05, 4.31891530752182e-05, 4.6115368604660034e-05, 4.904158413410187e-05, 5.19677996635437e-05, 5.4894015192985535e-05, 5.782023072242737e-05, 6.07464462518692e-05, 6.367266178131104e-05, 6.659887731075287e-05, 6.95250928401947e-05, 7.245130836963654e-05, 7.537752389907837e-05, 7.83037394285202e-05, 8.122995495796204e-05, 8.415617048740387e-05, 8.70823860168457e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 6.0, 10.0, 17.0, 28.0, 45.0, 46.0, 72.0, 88.0, 138.0, 242.0, 260.0, 439.0, 716.0, 985.0, 1606.0, 2622.0, 4642.0, 8802.0, 18326.0, 41479.0, 97150.0, 208848.0, 298741.0, 196944.0, 90855.0, 38240.0, 17392.0, 8282.0, 4460.0, 2575.0, 1498.0, 1022.0, 595.0, 426.0, 295.0, 228.0, 117.0, 112.0, 61.0, 50.0, 21.0, 17.0, 18.0, 11.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.869140625, -1.809722900390625, -1.75030517578125, -1.690887451171875, -1.6314697265625, -1.572052001953125, -1.51263427734375, -1.453216552734375, -1.393798828125, -1.334381103515625, -1.27496337890625, -1.215545654296875, -1.1561279296875, -1.096710205078125, -1.03729248046875, -0.977874755859375, -0.91845703125, -0.859039306640625, -0.79962158203125, -0.740203857421875, -0.6807861328125, -0.621368408203125, -0.56195068359375, -0.502532958984375, -0.443115234375, -0.383697509765625, -0.32427978515625, -0.264862060546875, -0.2054443359375, -0.146026611328125, -0.08660888671875, -0.027191162109375, 0.0322265625, 0.091644287109375, 0.15106201171875, 0.210479736328125, 0.2698974609375, 0.329315185546875, 0.38873291015625, 0.448150634765625, 0.507568359375, 0.566986083984375, 0.62640380859375, 0.685821533203125, 0.7452392578125, 0.804656982421875, 0.86407470703125, 0.923492431640625, 0.98291015625, 1.042327880859375, 1.10174560546875, 1.161163330078125, 1.2205810546875, 1.279998779296875, 1.33941650390625, 1.398834228515625, 1.458251953125, 1.517669677734375, 1.57708740234375, 1.636505126953125, 1.6959228515625, 1.755340576171875, 1.81475830078125, 1.874176025390625, 1.93359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 11.0, 6.0, 12.0, 10.0, 18.0, 32.0, 33.0, 31.0, 56.0, 60.0, 75.0, 79.0, 95.0, 101.0, 74.0, 62.0, 53.0, 56.0, 43.0, 20.0, 24.0, 9.0, 10.0, 10.0, 5.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46533203125, -0.44701385498046875, -0.4286956787109375, -0.41037750244140625, -0.392059326171875, -0.37374114990234375, -0.3554229736328125, -0.33710479736328125, -0.31878662109375, -0.30046844482421875, -0.2821502685546875, -0.26383209228515625, -0.245513916015625, -0.22719573974609375, -0.2088775634765625, -0.19055938720703125, -0.1722412109375, -0.15392303466796875, -0.1356048583984375, -0.11728668212890625, -0.098968505859375, -0.08065032958984375, -0.0623321533203125, -0.04401397705078125, -0.02569580078125, -0.00737762451171875, 0.0109405517578125, 0.02925872802734375, 0.047576904296875, 0.06589508056640625, 0.0842132568359375, 0.10253143310546875, 0.120849609375, 0.13916778564453125, 0.1574859619140625, 0.17580413818359375, 0.194122314453125, 0.21244049072265625, 0.2307586669921875, 0.24907684326171875, 0.26739501953125, 0.28571319580078125, 0.3040313720703125, 0.32234954833984375, 0.340667724609375, 0.35898590087890625, 0.3773040771484375, 0.39562225341796875, 0.4139404296875, 0.43225860595703125, 0.4505767822265625, 0.46889495849609375, 0.487213134765625, 0.5055313110351562, 0.5238494873046875, 0.5421676635742188, 0.56048583984375, 0.5788040161132812, 0.5971221923828125, 0.6154403686523438, 0.633758544921875, 0.6520767211914062, 0.6703948974609375, 0.6887130737304688, 0.70703125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 14.0, 13.0, 6.0, 14.0, 18.0, 13.0, 22.0, 21.0, 31.0, 34.0, 43.0, 41.0, 47.0, 38.0, 43.0, 50.0, 49.0, 56.0, 49.0, 51.0, 41.0, 43.0, 32.0, 34.0, 25.0, 33.0, 29.0, 15.0, 13.0, 11.0, 11.0, 8.0, 11.0, 2.0, 11.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-20.51023292541504, -19.919540405273438, -19.328847885131836, -18.738155364990234, -18.147464752197266, -17.556772232055664, -16.966079711914062, -16.37538719177246, -15.78469467163086, -15.194002151489258, -14.603309631347656, -14.012618064880371, -13.42192554473877, -12.831233024597168, -12.240541458129883, -11.649848937988281, -11.05915641784668, -10.468463897705078, -9.877771377563477, -9.287079811096191, -8.69638729095459, -8.105694770812988, -7.515002727508545, -6.924310684204102, -6.3336181640625, -5.742925643920898, -5.152233600616455, -4.561541557312012, -3.97084903717041, -3.3801567554473877, -2.7894644737243652, -2.198772430419922, -1.6080780029296875, -1.017385721206665, -0.4266934394836426, 0.16399884223937988, 0.7546911239624023, 1.3453834056854248, 1.9360756874084473, 2.5267677307128906, 3.117460250854492, 3.7081525325775146, 4.298844814300537, 4.8895368576049805, 5.480229377746582, 6.070921897888184, 6.661613941192627, 7.25230598449707, 7.842998504638672, 8.433691024780273, 9.024383544921875, 9.61507511138916, 10.205767631530762, 10.796460151672363, 11.387151718139648, 11.97784423828125, 12.568536758422852, 13.159229278564453, 13.749921798706055, 14.34061336517334, 14.931305885314941, 15.521998405456543, 16.112689971923828, 16.70338249206543, 17.29407501220703]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 3.0, 9.0, 10.0, 13.0, 22.0, 16.0, 22.0, 25.0, 33.0, 30.0, 32.0, 43.0, 47.0, 48.0, 51.0, 52.0, 39.0, 44.0, 36.0, 52.0, 49.0, 29.0, 35.0, 44.0, 37.0, 32.0, 28.0, 29.0, 18.0, 25.0, 11.0, 11.0, 10.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.121078491210938, -20.501134872436523, -19.881189346313477, -19.261245727539062, -18.641300201416016, -18.0213565826416, -17.401411056518555, -16.78146743774414, -16.161521911621094, -15.541577339172363, -14.921632766723633, -14.301688194274902, -13.681743621826172, -13.061799049377441, -12.441854476928711, -11.821910858154297, -11.201966285705566, -10.582021713256836, -9.962077140808105, -9.342132568359375, -8.722187995910645, -8.102243423461914, -7.482299327850342, -6.862354755401611, -6.242410182952881, -5.62246561050415, -5.00252103805542, -4.382576942443848, -3.762632131576538, -3.1426875591278076, -2.5227432250976562, -1.9027986526489258, -1.2828540802001953, -0.6629095673561096, -0.042965054512023926, 0.576979398727417, 1.1969239711761475, 1.816868543624878, 2.4368128776550293, 3.0567574501037598, 3.6767020225524902, 4.296646595001221, 4.916591167449951, 5.536535263061523, 6.156479835510254, 6.776424407958984, 7.396368980407715, 8.016313552856445, 8.636258125305176, 9.256202697753906, 9.876147270202637, 10.496091842651367, 11.116036415100098, 11.735980987548828, 12.355924606323242, 12.975870132446289, 13.595813751220703, 14.215758323669434, 14.835702896118164, 15.455647468566895, 16.075592041015625, 16.69553565979004, 17.315481185913086, 17.9354248046875, 18.555370330810547]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 6.0, 10.0, 18.0, 21.0, 19.0, 56.0, 58.0, 84.0, 153.0, 232.0, 315.0, 507.0, 809.0, 1224.0, 1860.0, 3126.0, 4933.0, 8125.0, 13310.0, 22242.0, 35294.0, 56007.0, 82729.0, 111818.0, 134880.0, 142595.0, 128090.0, 101655.0, 72562.0, 47660.0, 30061.0, 18635.0, 11205.0, 6797.0, 4191.0, 2675.0, 1712.0, 965.0, 676.0, 432.0, 289.0, 174.0, 111.0, 83.0, 50.0, 28.0, 19.0, 14.0, 15.0, 8.0, 1.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.578125, -19.921142578125, -19.26416015625, -18.607177734375, -17.9501953125, -17.293212890625, -16.63623046875, -15.979248046875, -15.322265625, -14.665283203125, -14.00830078125, -13.351318359375, -12.6943359375, -12.037353515625, -11.38037109375, -10.723388671875, -10.06640625, -9.409423828125, -8.75244140625, -8.095458984375, -7.4384765625, -6.781494140625, -6.12451171875, -5.467529296875, -4.810546875, -4.153564453125, -3.49658203125, -2.839599609375, -2.1826171875, -1.525634765625, -0.86865234375, -0.211669921875, 0.4453125, 1.102294921875, 1.75927734375, 2.416259765625, 3.0732421875, 3.730224609375, 4.38720703125, 5.044189453125, 5.701171875, 6.358154296875, 7.01513671875, 7.672119140625, 8.3291015625, 8.986083984375, 9.64306640625, 10.300048828125, 10.95703125, 11.614013671875, 12.27099609375, 12.927978515625, 13.5849609375, 14.241943359375, 14.89892578125, 15.555908203125, 16.212890625, 16.869873046875, 17.52685546875, 18.183837890625, 18.8408203125, 19.497802734375, 20.15478515625, 20.811767578125, 21.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 5.0, 13.0, 13.0, 18.0, 23.0, 20.0, 20.0, 37.0, 29.0, 36.0, 45.0, 38.0, 47.0, 59.0, 51.0, 36.0, 43.0, 39.0, 48.0, 47.0, 33.0, 36.0, 44.0, 41.0, 27.0, 23.0, 27.0, 23.0, 19.0, 16.0, 11.0, 9.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.912353515625, -19.30908203125, -18.705810546875, -18.1025390625, -17.499267578125, -16.89599609375, -16.292724609375, -15.689453125, -15.086181640625, -14.48291015625, -13.879638671875, -13.2763671875, -12.673095703125, -12.06982421875, -11.466552734375, -10.86328125, -10.260009765625, -9.65673828125, -9.053466796875, -8.4501953125, -7.846923828125, -7.24365234375, -6.640380859375, -6.037109375, -5.433837890625, -4.83056640625, -4.227294921875, -3.6240234375, -3.020751953125, -2.41748046875, -1.814208984375, -1.2109375, -0.607666015625, -0.00439453125, 0.598876953125, 1.2021484375, 1.805419921875, 2.40869140625, 3.011962890625, 3.615234375, 4.218505859375, 4.82177734375, 5.425048828125, 6.0283203125, 6.631591796875, 7.23486328125, 7.838134765625, 8.44140625, 9.044677734375, 9.64794921875, 10.251220703125, 10.8544921875, 11.457763671875, 12.06103515625, 12.664306640625, 13.267578125, 13.870849609375, 14.47412109375, 15.077392578125, 15.6806640625, 16.283935546875, 16.88720703125, 17.490478515625, 18.09375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 4.0, 9.0, 23.0, 18.0, 32.0, 48.0, 84.0, 128.0, 203.0, 276.0, 494.0, 765.0, 1184.0, 1936.0, 3232.0, 5568.0, 9548.0, 16760.0, 29738.0, 51739.0, 87075.0, 132070.0, 168528.0, 172393.0, 139316.0, 94008.0, 56871.0, 32555.0, 18262.0, 10408.0, 6029.0, 3543.0, 2111.0, 1338.0, 820.0, 521.0, 356.0, 190.0, 124.0, 88.0, 53.0, 39.0, 26.0, 16.0, 13.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.078125, -26.177978515625, -25.27783203125, -24.377685546875, -23.4775390625, -22.577392578125, -21.67724609375, -20.777099609375, -19.876953125, -18.976806640625, -18.07666015625, -17.176513671875, -16.2763671875, -15.376220703125, -14.47607421875, -13.575927734375, -12.67578125, -11.775634765625, -10.87548828125, -9.975341796875, -9.0751953125, -8.175048828125, -7.27490234375, -6.374755859375, -5.474609375, -4.574462890625, -3.67431640625, -2.774169921875, -1.8740234375, -0.973876953125, -0.07373046875, 0.826416015625, 1.7265625, 2.626708984375, 3.52685546875, 4.427001953125, 5.3271484375, 6.227294921875, 7.12744140625, 8.027587890625, 8.927734375, 9.827880859375, 10.72802734375, 11.628173828125, 12.5283203125, 13.428466796875, 14.32861328125, 15.228759765625, 16.12890625, 17.029052734375, 17.92919921875, 18.829345703125, 19.7294921875, 20.629638671875, 21.52978515625, 22.429931640625, 23.330078125, 24.230224609375, 25.13037109375, 26.030517578125, 26.9306640625, 27.830810546875, 28.73095703125, 29.631103515625, 30.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 4.0, 1.0, 7.0, 2.0, 11.0, 2.0, 13.0, 15.0, 11.0, 18.0, 20.0, 18.0, 14.0, 26.0, 27.0, 34.0, 35.0, 38.0, 36.0, 44.0, 45.0, 31.0, 40.0, 41.0, 34.0, 40.0, 35.0, 47.0, 38.0, 36.0, 29.0, 24.0, 25.0, 28.0, 20.0, 19.0, 15.0, 18.0, 15.0, 15.0, 8.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.380615234375, -8.05029296875, -7.719970703125, -7.3896484375, -7.059326171875, -6.72900390625, -6.398681640625, -6.068359375, -5.738037109375, -5.40771484375, -5.077392578125, -4.7470703125, -4.416748046875, -4.08642578125, -3.756103515625, -3.42578125, -3.095458984375, -2.76513671875, -2.434814453125, -2.1044921875, -1.774169921875, -1.44384765625, -1.113525390625, -0.783203125, -0.452880859375, -0.12255859375, 0.207763671875, 0.5380859375, 0.868408203125, 1.19873046875, 1.529052734375, 1.859375, 2.189697265625, 2.52001953125, 2.850341796875, 3.1806640625, 3.510986328125, 3.84130859375, 4.171630859375, 4.501953125, 4.832275390625, 5.16259765625, 5.492919921875, 5.8232421875, 6.153564453125, 6.48388671875, 6.814208984375, 7.14453125, 7.474853515625, 7.80517578125, 8.135498046875, 8.4658203125, 8.796142578125, 9.12646484375, 9.456787109375, 9.787109375, 10.117431640625, 10.44775390625, 10.778076171875, 11.1083984375, 11.438720703125, 11.76904296875, 12.099365234375, 12.4296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [6.0, 6.0, 6.0, 12.0, 21.0, 25.0, 38.0, 64.0, 72.0, 103.0, 137.0, 196.0, 324.0, 446.0, 621.0, 968.0, 1309.0, 1976.0, 2962.0, 4349.0, 6750.0, 10155.0, 15735.0, 23949.0, 36895.0, 55979.0, 80572.0, 108088.0, 130340.0, 136305.0, 123227.0, 97454.0, 70580.0, 48111.0, 31588.0, 20135.0, 13222.0, 8559.0, 5575.0, 3697.0, 2568.0, 1692.0, 1101.0, 864.0, 558.0, 386.0, 289.0, 170.0, 124.0, 84.0, 64.0, 35.0, 23.0, 13.0, 19.0, 11.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.3125, -4.16534423828125, -4.0181884765625, -3.87103271484375, -3.723876953125, -3.57672119140625, -3.4295654296875, -3.28240966796875, -3.13525390625, -2.98809814453125, -2.8409423828125, -2.69378662109375, -2.546630859375, -2.39947509765625, -2.2523193359375, -2.10516357421875, -1.9580078125, -1.81085205078125, -1.6636962890625, -1.51654052734375, -1.369384765625, -1.22222900390625, -1.0750732421875, -0.92791748046875, -0.78076171875, -0.63360595703125, -0.4864501953125, -0.33929443359375, -0.192138671875, -0.04498291015625, 0.1021728515625, 0.24932861328125, 0.396484375, 0.54364013671875, 0.6907958984375, 0.83795166015625, 0.985107421875, 1.13226318359375, 1.2794189453125, 1.42657470703125, 1.57373046875, 1.72088623046875, 1.8680419921875, 2.01519775390625, 2.162353515625, 2.30950927734375, 2.4566650390625, 2.60382080078125, 2.7509765625, 2.89813232421875, 3.0452880859375, 3.19244384765625, 3.339599609375, 3.48675537109375, 3.6339111328125, 3.78106689453125, 3.92822265625, 4.07537841796875, 4.2225341796875, 4.36968994140625, 4.516845703125, 4.66400146484375, 4.8111572265625, 4.95831298828125, 5.10546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 8.0, 2.0, 12.0, 8.0, 22.0, 14.0, 20.0, 24.0, 31.0, 43.0, 41.0, 43.0, 43.0, 53.0, 49.0, 50.0, 53.0, 63.0, 53.0, 54.0, 49.0, 39.0, 31.0, 34.0, 30.0, 22.0, 25.0, 15.0, 10.0, 12.0, 5.0, 4.0, 7.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00061798095703125, -0.0005995109677314758, -0.0005810409784317017, -0.0005625709891319275, -0.0005441009998321533, -0.0005256310105323792, -0.000507161021232605, -0.0004886910319328308, -0.00047022104263305664, -0.00045175105333328247, -0.0004332810640335083, -0.00041481107473373413, -0.00039634108543395996, -0.0003778710961341858, -0.0003594011068344116, -0.00034093111753463745, -0.0003224611282348633, -0.0003039911389350891, -0.00028552114963531494, -0.00026705116033554077, -0.0002485811710357666, -0.00023011118173599243, -0.00021164119243621826, -0.0001931712031364441, -0.00017470121383666992, -0.00015623122453689575, -0.00013776123523712158, -0.00011929124593734741, -0.00010082125663757324, -8.235126733779907e-05, -6.38812780380249e-05, -4.541128873825073e-05, -2.6941299438476562e-05, -8.471310138702393e-06, 9.998679161071777e-06, 2.8468668460845947e-05, 4.693865776062012e-05, 6.540864706039429e-05, 8.387863636016846e-05, 0.00010234862565994263, 0.0001208186149597168, 0.00013928860425949097, 0.00015775859355926514, 0.0001762285828590393, 0.00019469857215881348, 0.00021316856145858765, 0.00023163855075836182, 0.000250108540058136, 0.00026857852935791016, 0.0002870485186576843, 0.0003055185079574585, 0.00032398849725723267, 0.00034245848655700684, 0.000360928475856781, 0.0003793984651565552, 0.00039786845445632935, 0.0004163384437561035, 0.0004348084330558777, 0.00045327842235565186, 0.000471748411655426, 0.0004902184009552002, 0.0005086883902549744, 0.0005271583795547485, 0.0005456283688545227, 0.0005640983581542969]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 15.0, 25.0, 32.0, 44.0, 71.0, 101.0, 160.0, 248.0, 373.0, 587.0, 914.0, 1346.0, 1995.0, 3249.0, 5051.0, 7831.0, 12122.0, 18975.0, 29749.0, 45453.0, 67500.0, 94879.0, 122283.0, 138508.0, 133624.0, 112476.0, 84316.0, 58314.0, 38401.0, 24856.0, 16118.0, 10337.0, 6660.0, 4204.0, 2699.0, 1786.0, 1185.0, 673.0, 488.0, 321.0, 218.0, 127.0, 85.0, 60.0, 36.0, 17.0, 14.0, 12.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0], "bins": [-5.1171875, -4.9658203125, -4.814453125, -4.6630859375, -4.51171875, -4.3603515625, -4.208984375, -4.0576171875, -3.90625, -3.7548828125, -3.603515625, -3.4521484375, -3.30078125, -3.1494140625, -2.998046875, -2.8466796875, -2.6953125, -2.5439453125, -2.392578125, -2.2412109375, -2.08984375, -1.9384765625, -1.787109375, -1.6357421875, -1.484375, -1.3330078125, -1.181640625, -1.0302734375, -0.87890625, -0.7275390625, -0.576171875, -0.4248046875, -0.2734375, -0.1220703125, 0.029296875, 0.1806640625, 0.33203125, 0.4833984375, 0.634765625, 0.7861328125, 0.9375, 1.0888671875, 1.240234375, 1.3916015625, 1.54296875, 1.6943359375, 1.845703125, 1.9970703125, 2.1484375, 2.2998046875, 2.451171875, 2.6025390625, 2.75390625, 2.9052734375, 3.056640625, 3.2080078125, 3.359375, 3.5107421875, 3.662109375, 3.8134765625, 3.96484375, 4.1162109375, 4.267578125, 4.4189453125, 4.5703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 8.0, 8.0, 9.0, 11.0, 12.0, 21.0, 18.0, 18.0, 27.0, 19.0, 34.0, 25.0, 43.0, 34.0, 56.0, 51.0, 41.0, 36.0, 49.0, 55.0, 34.0, 43.0, 46.0, 42.0, 29.0, 31.0, 26.0, 33.0, 25.0, 22.0, 12.0, 9.0, 16.0, 8.0, 9.0, 7.0, 10.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.837890625, -1.781646728515625, -1.72540283203125, -1.669158935546875, -1.6129150390625, -1.556671142578125, -1.50042724609375, -1.444183349609375, -1.387939453125, -1.331695556640625, -1.27545166015625, -1.219207763671875, -1.1629638671875, -1.106719970703125, -1.05047607421875, -0.994232177734375, -0.93798828125, -0.881744384765625, -0.82550048828125, -0.769256591796875, -0.7130126953125, -0.656768798828125, -0.60052490234375, -0.544281005859375, -0.488037109375, -0.431793212890625, -0.37554931640625, -0.319305419921875, -0.2630615234375, -0.206817626953125, -0.15057373046875, -0.094329833984375, -0.0380859375, 0.018157958984375, 0.07440185546875, 0.130645751953125, 0.1868896484375, 0.243133544921875, 0.29937744140625, 0.355621337890625, 0.411865234375, 0.468109130859375, 0.52435302734375, 0.580596923828125, 0.6368408203125, 0.693084716796875, 0.74932861328125, 0.805572509765625, 0.86181640625, 0.918060302734375, 0.97430419921875, 1.030548095703125, 1.0867919921875, 1.143035888671875, 1.19927978515625, 1.255523681640625, 1.311767578125, 1.368011474609375, 1.42425537109375, 1.480499267578125, 1.5367431640625, 1.592987060546875, 1.64923095703125, 1.705474853515625, 1.76171875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 6.0, 4.0, 3.0, 9.0, 6.0, 10.0, 12.0, 15.0, 21.0, 22.0, 29.0, 39.0, 33.0, 40.0, 44.0, 58.0, 61.0, 60.0, 58.0, 57.0, 53.0, 49.0, 51.0, 35.0, 38.0, 38.0, 24.0, 24.0, 28.0, 15.0, 13.0, 11.0, 7.0, 10.0, 6.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-24.08905601501465, -23.41295623779297, -22.736854553222656, -22.060752868652344, -21.384653091430664, -20.708553314208984, -20.032451629638672, -19.35634994506836, -18.68025016784668, -18.004150390625, -17.328048706054688, -16.651947021484375, -15.975847244262695, -15.2997465133667, -14.623645782470703, -13.947545051574707, -13.271444320678711, -12.595343589782715, -11.919242858886719, -11.243142127990723, -10.567041397094727, -9.89094066619873, -9.214839935302734, -8.538739204406738, -7.862638473510742, -7.186537742614746, -6.51043701171875, -5.834336280822754, -5.158235549926758, -4.482134819030762, -3.8060340881347656, -3.1299333572387695, -2.4538326263427734, -1.7777318954467773, -1.1016311645507812, -0.42553043365478516, 0.25057029724121094, 0.926671028137207, 1.6027717590332031, 2.278872489929199, 2.9549732208251953, 3.6310739517211914, 4.3071746826171875, 4.983275413513184, 5.65937614440918, 6.335476875305176, 7.011577606201172, 7.687678337097168, 8.363779067993164, 9.03987979888916, 9.715980529785156, 10.392081260681152, 11.068181991577148, 11.744282722473145, 12.42038345336914, 13.096484184265137, 13.772584915161133, 14.448685646057129, 15.124786376953125, 15.800887107849121, 16.476987838745117, 17.153087615966797, 17.82918930053711, 18.505290985107422, 19.1813907623291]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 10.0, 9.0, 14.0, 27.0, 23.0, 29.0, 29.0, 46.0, 34.0, 38.0, 52.0, 45.0, 41.0, 39.0, 46.0, 55.0, 52.0, 46.0, 37.0, 35.0, 35.0, 40.0, 44.0, 28.0, 29.0, 22.0, 20.0, 15.0, 10.0, 10.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.734127044677734, -18.0801944732666, -17.426259994506836, -16.772327423095703, -16.118392944335938, -15.464460372924805, -14.810526847839355, -14.156593322753906, -13.502660751342773, -12.848727226257324, -12.194793701171875, -11.540861129760742, -10.886927604675293, -10.232994079589844, -9.579060554504395, -8.925127029418945, -8.271193504333496, -7.617259979248047, -6.963326930999756, -6.309393405914307, -5.655460357666016, -5.001526832580566, -4.347593307495117, -3.693660259246826, -3.039726734161377, -2.385793447494507, -1.7318600416183472, -1.0779266357421875, -0.4239933490753174, 0.22993993759155273, 0.883873462677002, 1.537806510925293, 2.191740036010742, 2.8456733226776123, 3.4996066093444824, 4.153540134429932, 4.807473182678223, 5.461406707763672, 6.115340232849121, 6.769273281097412, 7.423206806182861, 8.077139854431152, 8.731073379516602, 9.38500690460205, 10.0389404296875, 10.692873001098633, 11.346807479858398, 12.000740051269531, 12.65467357635498, 13.30860710144043, 13.962540626525879, 14.616474151611328, 15.270406723022461, 15.92434024810791, 16.57827377319336, 17.232206344604492, 17.886140823364258, 18.54007339477539, 19.194007873535156, 19.84794044494629, 20.501874923706055, 21.155807495117188, 21.809741973876953, 22.463674545288086, 23.11760711669922]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 11.0, 7.0, 20.0, 26.0, 51.0, 87.0, 109.0, 228.0, 392.0, 592.0, 967.0, 1668.0, 2722.0, 4559.0, 7267.0, 11963.0, 19798.0, 32579.0, 54974.0, 91879.0, 155919.0, 265317.0, 430506.0, 620319.0, 717815.0, 636080.0, 450531.0, 278496.0, 165796.0, 96924.0, 57553.0, 34527.0, 21332.0, 12718.0, 8008.0, 4845.0, 2995.0, 1814.0, 1115.0, 683.0, 414.0, 256.0, 161.0, 90.0, 65.0, 41.0, 27.0, 14.0, 10.0, 6.0, 5.0, 1.0, 4.0, 3.0], "bins": [-22.40625, -21.7578125, -21.109375, -20.4609375, -19.8125, -19.1640625, -18.515625, -17.8671875, -17.21875, -16.5703125, -15.921875, -15.2734375, -14.625, -13.9765625, -13.328125, -12.6796875, -12.03125, -11.3828125, -10.734375, -10.0859375, -9.4375, -8.7890625, -8.140625, -7.4921875, -6.84375, -6.1953125, -5.546875, -4.8984375, -4.25, -3.6015625, -2.953125, -2.3046875, -1.65625, -1.0078125, -0.359375, 0.2890625, 0.9375, 1.5859375, 2.234375, 2.8828125, 3.53125, 4.1796875, 4.828125, 5.4765625, 6.125, 6.7734375, 7.421875, 8.0703125, 8.71875, 9.3671875, 10.015625, 10.6640625, 11.3125, 11.9609375, 12.609375, 13.2578125, 13.90625, 14.5546875, 15.203125, 15.8515625, 16.5, 17.1484375, 17.796875, 18.4453125, 19.09375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 13.0, 28.0, 25.0, 23.0, 27.0, 42.0, 33.0, 47.0, 40.0, 50.0, 47.0, 29.0, 45.0, 48.0, 53.0, 53.0, 38.0, 39.0, 35.0, 37.0, 41.0, 33.0, 33.0, 23.0, 20.0, 14.0, 15.0, 11.0, 7.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.75, -16.17578125, -15.6015625, -15.02734375, -14.453125, -13.87890625, -13.3046875, -12.73046875, -12.15625, -11.58203125, -11.0078125, -10.43359375, -9.859375, -9.28515625, -8.7109375, -8.13671875, -7.5625, -6.98828125, -6.4140625, -5.83984375, -5.265625, -4.69140625, -4.1171875, -3.54296875, -2.96875, -2.39453125, -1.8203125, -1.24609375, -0.671875, -0.09765625, 0.4765625, 1.05078125, 1.625, 2.19921875, 2.7734375, 3.34765625, 3.921875, 4.49609375, 5.0703125, 5.64453125, 6.21875, 6.79296875, 7.3671875, 7.94140625, 8.515625, 9.08984375, 9.6640625, 10.23828125, 10.8125, 11.38671875, 11.9609375, 12.53515625, 13.109375, 13.68359375, 14.2578125, 14.83203125, 15.40625, 15.98046875, 16.5546875, 17.12890625, 17.703125, 18.27734375, 18.8515625, 19.42578125, 20.0]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 9.0, 5.0, 18.0, 18.0, 31.0, 45.0, 81.0, 105.0, 213.0, 269.0, 507.0, 872.0, 1441.0, 2321.0, 4110.0, 7654.0, 13849.0, 25236.0, 46433.0, 86345.0, 161349.0, 294324.0, 501995.0, 734271.0, 802834.0, 630033.0, 395009.0, 222905.0, 120339.0, 64281.0, 34624.0, 18709.0, 10473.0, 5724.0, 3197.0, 1871.0, 1095.0, 648.0, 375.0, 242.0, 151.0, 104.0, 63.0, 29.0, 30.0, 21.0, 8.0, 4.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.21875, -21.45947265625, -20.7001953125, -19.94091796875, -19.181640625, -18.42236328125, -17.6630859375, -16.90380859375, -16.14453125, -15.38525390625, -14.6259765625, -13.86669921875, -13.107421875, -12.34814453125, -11.5888671875, -10.82958984375, -10.0703125, -9.31103515625, -8.5517578125, -7.79248046875, -7.033203125, -6.27392578125, -5.5146484375, -4.75537109375, -3.99609375, -3.23681640625, -2.4775390625, -1.71826171875, -0.958984375, -0.19970703125, 0.5595703125, 1.31884765625, 2.078125, 2.83740234375, 3.5966796875, 4.35595703125, 5.115234375, 5.87451171875, 6.6337890625, 7.39306640625, 8.15234375, 8.91162109375, 9.6708984375, 10.43017578125, 11.189453125, 11.94873046875, 12.7080078125, 13.46728515625, 14.2265625, 14.98583984375, 15.7451171875, 16.50439453125, 17.263671875, 18.02294921875, 18.7822265625, 19.54150390625, 20.30078125, 21.06005859375, 21.8193359375, 22.57861328125, 23.337890625, 24.09716796875, 24.8564453125, 25.61572265625, 26.375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 8.0, 14.0, 14.0, 21.0, 17.0, 29.0, 37.0, 52.0, 51.0, 70.0, 80.0, 106.0, 123.0, 131.0, 170.0, 202.0, 206.0, 233.0, 234.0, 261.0, 236.0, 248.0, 231.0, 200.0, 173.0, 171.0, 135.0, 100.0, 83.0, 83.0, 54.0, 75.0, 59.0, 34.0, 29.0, 24.0, 16.0, 15.0, 12.0, 10.0, 6.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.703125, -8.4404296875, -8.177734375, -7.9150390625, -7.65234375, -7.3896484375, -7.126953125, -6.8642578125, -6.6015625, -6.3388671875, -6.076171875, -5.8134765625, -5.55078125, -5.2880859375, -5.025390625, -4.7626953125, -4.5, -4.2373046875, -3.974609375, -3.7119140625, -3.44921875, -3.1865234375, -2.923828125, -2.6611328125, -2.3984375, -2.1357421875, -1.873046875, -1.6103515625, -1.34765625, -1.0849609375, -0.822265625, -0.5595703125, -0.296875, -0.0341796875, 0.228515625, 0.4912109375, 0.75390625, 1.0166015625, 1.279296875, 1.5419921875, 1.8046875, 2.0673828125, 2.330078125, 2.5927734375, 2.85546875, 3.1181640625, 3.380859375, 3.6435546875, 3.90625, 4.1689453125, 4.431640625, 4.6943359375, 4.95703125, 5.2197265625, 5.482421875, 5.7451171875, 6.0078125, 6.2705078125, 6.533203125, 6.7958984375, 7.05859375, 7.3212890625, 7.583984375, 7.8466796875, 8.109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 3.0, 8.0, 6.0, 19.0, 15.0, 19.0, 20.0, 21.0, 25.0, 36.0, 41.0, 39.0, 50.0, 47.0, 51.0, 53.0, 67.0, 34.0, 48.0, 46.0, 30.0, 43.0, 30.0, 27.0, 25.0, 28.0, 21.0, 21.0, 27.0, 20.0, 12.0, 13.0, 6.0, 7.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.556360244750977, -18.9261474609375, -18.295934677124023, -17.665721893310547, -17.03550910949707, -16.405296325683594, -15.775084495544434, -15.144871711730957, -14.51465892791748, -13.884446144104004, -13.254233360290527, -12.62402057647705, -11.99380874633789, -11.363595962524414, -10.733383178710938, -10.103170394897461, -9.472957611083984, -8.842744827270508, -8.212532043457031, -7.582319736480713, -6.952106952667236, -6.32189416885376, -5.691681861877441, -5.061469078063965, -4.431256294250488, -3.8010435104370117, -3.1708309650421143, -2.540618419647217, -1.9104056358337402, -1.2801928520202637, -0.6499803066253662, -0.01976776123046875, 0.6104469299316406, 1.2406595945358276, 1.8708722591400146, 2.501084804534912, 3.1312975883483887, 3.7615103721618652, 4.391722679138184, 5.02193546295166, 5.652148246765137, 6.282361030578613, 6.91257381439209, 7.542786121368408, 8.172998428344727, 8.803211212158203, 9.43342399597168, 10.063636779785156, 10.693849563598633, 11.32406234741211, 11.954275131225586, 12.584487915039062, 13.214700698852539, 13.844913482666016, 14.475125312805176, 15.105338096618652, 15.735550880432129, 16.36576271057129, 16.995975494384766, 17.626188278198242, 18.25640106201172, 18.886613845825195, 19.516826629638672, 20.14703941345215, 20.777252197265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 9.0, 13.0, 6.0, 20.0, 21.0, 27.0, 29.0, 30.0, 41.0, 34.0, 36.0, 52.0, 39.0, 60.0, 39.0, 41.0, 32.0, 44.0, 45.0, 43.0, 41.0, 36.0, 34.0, 29.0, 35.0, 27.0, 15.0, 17.0, 16.0, 11.0, 15.0, 7.0, 8.0, 8.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.36700439453125, -16.73833656311035, -16.109668731689453, -15.481000900268555, -14.852333068847656, -14.223665237426758, -13.594998359680176, -12.966330528259277, -12.337662696838379, -11.70899486541748, -11.080327033996582, -10.451659202575684, -9.822992324829102, -9.194324493408203, -8.565656661987305, -7.936988830566406, -7.308320999145508, -6.679653167724609, -6.050985336303711, -5.422317981719971, -4.793650150299072, -4.164982318878174, -3.5363147258758545, -2.907647132873535, -2.2789793014526367, -1.6503115892410278, -1.021643877029419, -0.39297616481781006, 0.23569154739379883, 0.8643593788146973, 1.4930269718170166, 2.121694564819336, 2.7503604888916016, 3.3790283203125, 4.007696151733398, 4.636363506317139, 5.265031337738037, 5.8936991691589355, 6.522366523742676, 7.151034355163574, 7.779702186584473, 8.408370018005371, 9.03703784942627, 9.665705680847168, 10.29437255859375, 10.923040390014648, 11.551708221435547, 12.180376052856445, 12.809043884277344, 13.437711715698242, 14.06637954711914, 14.695047378540039, 15.323715209960938, 15.952383041381836, 16.581050872802734, 17.209716796875, 17.83838653564453, 18.46705436706543, 19.095722198486328, 19.724390029907227, 20.353057861328125, 20.981725692749023, 21.610393524169922, 22.239059448242188, 22.867727279663086]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 15.0, 20.0, 32.0, 45.0, 69.0, 88.0, 155.0, 231.0, 343.0, 526.0, 745.0, 1234.0, 1809.0, 2685.0, 4290.0, 6668.0, 10294.0, 16160.0, 25090.0, 39195.0, 59423.0, 86717.0, 115382.0, 136243.0, 139457.0, 121552.0, 92839.0, 65307.0, 43573.0, 28046.0, 17980.0, 11471.0, 7323.0, 4736.0, 2974.0, 2008.0, 1282.0, 873.0, 562.0, 404.0, 231.0, 146.0, 113.0, 79.0, 50.0, 28.0, 18.0, 19.0, 9.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.90625, -9.587890625, -9.26953125, -8.951171875, -8.6328125, -8.314453125, -7.99609375, -7.677734375, -7.359375, -7.041015625, -6.72265625, -6.404296875, -6.0859375, -5.767578125, -5.44921875, -5.130859375, -4.8125, -4.494140625, -4.17578125, -3.857421875, -3.5390625, -3.220703125, -2.90234375, -2.583984375, -2.265625, -1.947265625, -1.62890625, -1.310546875, -0.9921875, -0.673828125, -0.35546875, -0.037109375, 0.28125, 0.599609375, 0.91796875, 1.236328125, 1.5546875, 1.873046875, 2.19140625, 2.509765625, 2.828125, 3.146484375, 3.46484375, 3.783203125, 4.1015625, 4.419921875, 4.73828125, 5.056640625, 5.375, 5.693359375, 6.01171875, 6.330078125, 6.6484375, 6.966796875, 7.28515625, 7.603515625, 7.921875, 8.240234375, 8.55859375, 8.876953125, 9.1953125, 9.513671875, 9.83203125, 10.150390625, 10.46875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 4.0, 10.0, 10.0, 8.0, 13.0, 18.0, 17.0, 27.0, 20.0, 31.0, 37.0, 38.0, 38.0, 28.0, 51.0, 53.0, 53.0, 43.0, 35.0, 38.0, 42.0, 44.0, 35.0, 45.0, 41.0, 32.0, 31.0, 32.0, 20.0, 17.0, 10.0, 15.0, 15.0, 11.0, 8.0, 9.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.17578125, -17.5078125, -16.83984375, -16.171875, -15.50390625, -14.8359375, -14.16796875, -13.5, -12.83203125, -12.1640625, -11.49609375, -10.828125, -10.16015625, -9.4921875, -8.82421875, -8.15625, -7.48828125, -6.8203125, -6.15234375, -5.484375, -4.81640625, -4.1484375, -3.48046875, -2.8125, -2.14453125, -1.4765625, -0.80859375, -0.140625, 0.52734375, 1.1953125, 1.86328125, 2.53125, 3.19921875, 3.8671875, 4.53515625, 5.203125, 5.87109375, 6.5390625, 7.20703125, 7.875, 8.54296875, 9.2109375, 9.87890625, 10.546875, 11.21484375, 11.8828125, 12.55078125, 13.21875, 13.88671875, 14.5546875, 15.22265625, 15.890625, 16.55859375, 17.2265625, 17.89453125, 18.5625, 19.23046875, 19.8984375, 20.56640625, 21.234375, 21.90234375, 22.5703125, 23.23828125, 23.90625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 5.0, 11.0, 15.0, 23.0, 24.0, 48.0, 64.0, 106.0, 146.0, 244.0, 316.0, 458.0, 661.0, 921.0, 1361.0, 2029.0, 2961.0, 4400.0, 6965.0, 11065.0, 17233.0, 30391.0, 283939.0, 596326.0, 35195.0, 19606.0, 11785.0, 7439.0, 4827.0, 3192.0, 2169.0, 1398.0, 974.0, 696.0, 455.0, 359.0, 232.0, 168.0, 113.0, 73.0, 47.0, 45.0, 28.0, 12.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-21.65625, -21.021240234375, -20.38623046875, -19.751220703125, -19.1162109375, -18.481201171875, -17.84619140625, -17.211181640625, -16.576171875, -15.941162109375, -15.30615234375, -14.671142578125, -14.0361328125, -13.401123046875, -12.76611328125, -12.131103515625, -11.49609375, -10.861083984375, -10.22607421875, -9.591064453125, -8.9560546875, -8.321044921875, -7.68603515625, -7.051025390625, -6.416015625, -5.781005859375, -5.14599609375, -4.510986328125, -3.8759765625, -3.240966796875, -2.60595703125, -1.970947265625, -1.3359375, -0.700927734375, -0.06591796875, 0.569091796875, 1.2041015625, 1.839111328125, 2.47412109375, 3.109130859375, 3.744140625, 4.379150390625, 5.01416015625, 5.649169921875, 6.2841796875, 6.919189453125, 7.55419921875, 8.189208984375, 8.82421875, 9.459228515625, 10.09423828125, 10.729248046875, 11.3642578125, 11.999267578125, 12.63427734375, 13.269287109375, 13.904296875, 14.539306640625, 15.17431640625, 15.809326171875, 16.4443359375, 17.079345703125, 17.71435546875, 18.349365234375, 18.984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 7.0, 2.0, 6.0, 5.0, 4.0, 14.0, 9.0, 15.0, 14.0, 16.0, 29.0, 25.0, 29.0, 30.0, 23.0, 32.0, 45.0, 25.0, 36.0, 34.0, 39.0, 42.0, 42.0, 34.0, 34.0, 44.0, 31.0, 53.0, 30.0, 22.0, 35.0, 26.0, 15.0, 20.0, 20.0, 21.0, 20.0, 10.0, 11.0, 11.0, 9.0, 8.0, 4.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.359375, -12.9268798828125, -12.494384765625, -12.0618896484375, -11.62939453125, -11.1968994140625, -10.764404296875, -10.3319091796875, -9.8994140625, -9.4669189453125, -9.034423828125, -8.6019287109375, -8.16943359375, -7.7369384765625, -7.304443359375, -6.8719482421875, -6.439453125, -6.0069580078125, -5.574462890625, -5.1419677734375, -4.70947265625, -4.2769775390625, -3.844482421875, -3.4119873046875, -2.9794921875, -2.5469970703125, -2.114501953125, -1.6820068359375, -1.24951171875, -0.8170166015625, -0.384521484375, 0.0479736328125, 0.48046875, 0.9129638671875, 1.345458984375, 1.7779541015625, 2.21044921875, 2.6429443359375, 3.075439453125, 3.5079345703125, 3.9404296875, 4.3729248046875, 4.805419921875, 5.2379150390625, 5.67041015625, 6.1029052734375, 6.535400390625, 6.9678955078125, 7.400390625, 7.8328857421875, 8.265380859375, 8.6978759765625, 9.13037109375, 9.5628662109375, 9.995361328125, 10.4278564453125, 10.8603515625, 11.2928466796875, 11.725341796875, 12.1578369140625, 12.59033203125, 13.0228271484375, 13.455322265625, 13.8878173828125, 14.3203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 11.0, 11.0, 18.0, 21.0, 32.0, 52.0, 59.0, 114.0, 154.0, 218.0, 353.0, 550.0, 1031.0, 1944.0, 3855.0, 7992.0, 18432.0, 58789.0, 867058.0, 54098.0, 17713.0, 7715.0, 3806.0, 1901.0, 1060.0, 581.0, 334.0, 219.0, 137.0, 101.0, 62.0, 41.0, 17.0, 25.0, 16.0, 10.0, 3.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8759765625, -1.821563720703125, -1.76715087890625, -1.712738037109375, -1.6583251953125, -1.603912353515625, -1.54949951171875, -1.495086669921875, -1.440673828125, -1.386260986328125, -1.33184814453125, -1.277435302734375, -1.2230224609375, -1.168609619140625, -1.11419677734375, -1.059783935546875, -1.00537109375, -0.950958251953125, -0.89654541015625, -0.842132568359375, -0.7877197265625, -0.733306884765625, -0.67889404296875, -0.624481201171875, -0.570068359375, -0.515655517578125, -0.46124267578125, -0.406829833984375, -0.3524169921875, -0.298004150390625, -0.24359130859375, -0.189178466796875, -0.134765625, -0.080352783203125, -0.02593994140625, 0.028472900390625, 0.0828857421875, 0.137298583984375, 0.19171142578125, 0.246124267578125, 0.300537109375, 0.354949951171875, 0.40936279296875, 0.463775634765625, 0.5181884765625, 0.572601318359375, 0.62701416015625, 0.681427001953125, 0.73583984375, 0.790252685546875, 0.84466552734375, 0.899078369140625, 0.9534912109375, 1.007904052734375, 1.06231689453125, 1.116729736328125, 1.171142578125, 1.225555419921875, 1.27996826171875, 1.334381103515625, 1.3887939453125, 1.443206787109375, 1.49761962890625, 1.552032470703125, 1.6064453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 14.0, 6.0, 14.0, 19.0, 18.0, 31.0, 20.0, 45.0, 52.0, 56.0, 75.0, 88.0, 71.0, 71.0, 76.0, 64.0, 59.0, 58.0, 39.0, 26.0, 22.0, 20.0, 13.0, 10.0, 6.0, 4.0, 1.0, 7.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002963542938232422, -0.0002873167395591736, -0.000278279185295105, -0.0002692416310310364, -0.0002602040767669678, -0.00025116652250289917, -0.00024212896823883057, -0.00023309141397476196, -0.00022405385971069336, -0.00021501630544662476, -0.00020597875118255615, -0.00019694119691848755, -0.00018790364265441895, -0.00017886608839035034, -0.00016982853412628174, -0.00016079097986221313, -0.00015175342559814453, -0.00014271587133407593, -0.00013367831707000732, -0.00012464076280593872, -0.00011560320854187012, -0.00010656565427780151, -9.752810001373291e-05, -8.84905457496643e-05, -7.94529914855957e-05, -7.04154372215271e-05, -6.13778829574585e-05, -5.234032869338989e-05, -4.330277442932129e-05, -3.4265220165252686e-05, -2.5227665901184082e-05, -1.619011163711548e-05, -7.152557373046875e-06, 1.8849968910217285e-06, 1.0922551155090332e-05, 1.9960105419158936e-05, 2.899765968322754e-05, 3.803521394729614e-05, 4.7072768211364746e-05, 5.611032247543335e-05, 6.514787673950195e-05, 7.418543100357056e-05, 8.322298526763916e-05, 9.226053953170776e-05, 0.00010129809379577637, 0.00011033564805984497, 0.00011937320232391357, 0.00012841075658798218, 0.00013744831085205078, 0.00014648586511611938, 0.000155523419380188, 0.0001645609736442566, 0.0001735985279083252, 0.0001826360821723938, 0.0001916736364364624, 0.000200711190700531, 0.0002097487449645996, 0.0002187862992286682, 0.00022782385349273682, 0.00023686140775680542, 0.000245898962020874, 0.0002549365162849426, 0.00026397407054901123, 0.00027301162481307983, 0.00028204917907714844]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 12.0, 4.0, 18.0, 14.0, 25.0, 34.0, 54.0, 95.0, 130.0, 171.0, 288.0, 386.0, 609.0, 917.0, 1429.0, 1992.0, 2965.0, 4434.0, 6688.0, 10185.0, 15896.0, 24896.0, 41115.0, 68728.0, 116668.0, 176108.0, 196100.0, 147268.0, 89765.0, 52636.0, 31821.0, 19809.0, 12618.0, 8177.0, 5420.0, 3590.0, 2418.0, 1599.0, 1118.0, 776.0, 477.0, 344.0, 244.0, 181.0, 109.0, 82.0, 49.0, 40.0, 18.0, 23.0, 5.0, 3.0, 3.0, 7.0, 2.0, 3.0], "bins": [-0.84423828125, -0.8195877075195312, -0.7949371337890625, -0.7702865600585938, -0.745635986328125, -0.7209854125976562, -0.6963348388671875, -0.6716842651367188, -0.64703369140625, -0.6223831176757812, -0.5977325439453125, -0.5730819702148438, -0.548431396484375, -0.5237808227539062, -0.4991302490234375, -0.47447967529296875, -0.4498291015625, -0.42517852783203125, -0.4005279541015625, -0.37587738037109375, -0.351226806640625, -0.32657623291015625, -0.3019256591796875, -0.27727508544921875, -0.25262451171875, -0.22797393798828125, -0.2033233642578125, -0.17867279052734375, -0.154022216796875, -0.12937164306640625, -0.1047210693359375, -0.08007049560546875, -0.055419921875, -0.03076934814453125, -0.0061187744140625, 0.01853179931640625, 0.043182373046875, 0.06783294677734375, 0.0924835205078125, 0.11713409423828125, 0.14178466796875, 0.16643524169921875, 0.1910858154296875, 0.21573638916015625, 0.240386962890625, 0.26503753662109375, 0.2896881103515625, 0.31433868408203125, 0.3389892578125, 0.36363983154296875, 0.3882904052734375, 0.41294097900390625, 0.437591552734375, 0.46224212646484375, 0.4868927001953125, 0.5115432739257812, 0.53619384765625, 0.5608444213867188, 0.5854949951171875, 0.6101455688476562, 0.634796142578125, 0.6594467163085938, 0.6840972900390625, 0.7087478637695312, 0.7333984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 9.0, 7.0, 9.0, 4.0, 7.0, 10.0, 7.0, 22.0, 22.0, 26.0, 26.0, 47.0, 48.0, 59.0, 58.0, 77.0, 74.0, 70.0, 55.0, 64.0, 58.0, 41.0, 34.0, 40.0, 34.0, 22.0, 12.0, 16.0, 11.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259765625, -0.25099945068359375, -0.2422332763671875, -0.23346710205078125, -0.224700927734375, -0.21593475341796875, -0.2071685791015625, -0.19840240478515625, -0.18963623046875, -0.18087005615234375, -0.1721038818359375, -0.16333770751953125, -0.154571533203125, -0.14580535888671875, -0.1370391845703125, -0.12827301025390625, -0.1195068359375, -0.11074066162109375, -0.1019744873046875, -0.09320831298828125, -0.084442138671875, -0.07567596435546875, -0.0669097900390625, -0.05814361572265625, -0.04937744140625, -0.04061126708984375, -0.0318450927734375, -0.02307891845703125, -0.014312744140625, -0.00554656982421875, 0.0032196044921875, 0.01198577880859375, 0.020751953125, 0.02951812744140625, 0.0382843017578125, 0.04705047607421875, 0.055816650390625, 0.06458282470703125, 0.0733489990234375, 0.08211517333984375, 0.09088134765625, 0.09964752197265625, 0.1084136962890625, 0.11717987060546875, 0.125946044921875, 0.13471221923828125, 0.1434783935546875, 0.15224456787109375, 0.1610107421875, 0.16977691650390625, 0.1785430908203125, 0.18730926513671875, 0.196075439453125, 0.20484161376953125, 0.2136077880859375, 0.22237396240234375, 0.23114013671875, 0.23990631103515625, 0.2486724853515625, 0.25743865966796875, 0.266204833984375, 0.27497100830078125, 0.2837371826171875, 0.29250335693359375, 0.30126953125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 2.0, 7.0, 10.0, 9.0, 19.0, 17.0, 27.0, 27.0, 32.0, 33.0, 48.0, 55.0, 50.0, 63.0, 56.0, 56.0, 69.0, 56.0, 38.0, 56.0, 39.0, 26.0, 24.0, 33.0, 34.0, 26.0, 24.0, 13.0, 12.0, 7.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.31647491455078, -21.541765213012695, -20.767053604125977, -19.99234390258789, -19.217632293701172, -18.442922592163086, -17.668212890625, -16.89350128173828, -16.118791580200195, -15.344080924987793, -14.56937026977539, -13.794660568237305, -13.019949913024902, -12.2452392578125, -11.470529556274414, -10.695818901062012, -9.92110824584961, -9.146397590637207, -8.371686935424805, -7.596977233886719, -6.822266578674316, -6.047555923461914, -5.27284574508667, -4.498135566711426, -3.7234249114990234, -2.9487144947052, -2.174004077911377, -1.3992936611175537, -0.6245832443237305, 0.15012717247009277, 0.924837589263916, 1.6995477676391602, 2.4742584228515625, 3.2489688396453857, 4.023679256439209, 4.798389434814453, 5.5731000900268555, 6.347810745239258, 7.122520923614502, 7.897231101989746, 8.671941757202148, 9.44665241241455, 10.221363067626953, 10.996072769165039, 11.770783424377441, 12.545494079589844, 13.32020378112793, 14.094914436340332, 14.869625091552734, 15.644335746765137, 16.41904640197754, 17.193756103515625, 17.968467712402344, 18.74317741394043, 19.517887115478516, 20.292598724365234, 21.06730842590332, 21.842018127441406, 22.616729736328125, 23.39143943786621, 24.166149139404297, 24.940860748291016, 25.7155704498291, 26.490280151367188, 27.264991760253906]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 9.0, 10.0, 11.0, 19.0, 22.0, 24.0, 22.0, 36.0, 30.0, 41.0, 40.0, 32.0, 58.0, 47.0, 55.0, 34.0, 39.0, 36.0, 49.0, 36.0, 35.0, 46.0, 41.0, 34.0, 31.0, 25.0, 17.0, 20.0, 10.0, 14.0, 16.0, 10.0, 8.0, 7.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.66037368774414, -17.99193572998047, -17.323497772216797, -16.655059814453125, -15.98662281036377, -15.318184852600098, -14.649747848510742, -13.98130989074707, -13.312871932983398, -12.644433975219727, -11.975996017456055, -11.3075590133667, -10.639121055603027, -9.970683097839355, -9.30224609375, -8.633808135986328, -7.965370178222656, -7.296932220458984, -6.628494739532471, -5.960057258605957, -5.291619300842285, -4.623181343078613, -3.9547438621520996, -3.286306381225586, -2.617868423461914, -1.9494307041168213, -1.2809929847717285, -0.6125552654266357, 0.05588245391845703, 0.7243201732635498, 1.3927578926086426, 2.0611953735351562, 2.729633331298828, 3.398071050643921, 4.066508769989014, 4.734946250915527, 5.403384208679199, 6.071822166442871, 6.740259647369385, 7.408697128295898, 8.07713508605957, 8.745573043823242, 9.414011001586914, 10.08244800567627, 10.750885963439941, 11.419323921203613, 12.087760925292969, 12.75619888305664, 13.424636840820312, 14.093074798583984, 14.761512756347656, 15.429949760437012, 16.098388671875, 16.76682472229004, 17.43526268005371, 18.103700637817383, 18.772138595581055, 19.440576553344727, 20.1090145111084, 20.77745246887207, 21.44588851928711, 22.11432647705078, 22.782764434814453, 23.451202392578125, 24.119640350341797]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 15.0, 14.0, 26.0, 42.0, 51.0, 84.0, 98.0, 161.0, 236.0, 341.0, 499.0, 702.0, 1126.0, 1862.0, 2810.0, 4770.0, 7624.0, 12655.0, 21225.0, 35115.0, 56451.0, 86090.0, 120935.0, 148436.0, 152639.0, 130888.0, 96131.0, 64223.0, 40337.0, 24798.0, 14404.0, 8784.0, 5532.0, 3402.0, 2100.0, 1310.0, 881.0, 570.0, 354.0, 268.0, 174.0, 126.0, 97.0, 46.0, 36.0, 24.0, 22.0, 15.0, 14.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0], "bins": [-22.578125, -21.89697265625, -21.2158203125, -20.53466796875, -19.853515625, -19.17236328125, -18.4912109375, -17.81005859375, -17.12890625, -16.44775390625, -15.7666015625, -15.08544921875, -14.404296875, -13.72314453125, -13.0419921875, -12.36083984375, -11.6796875, -10.99853515625, -10.3173828125, -9.63623046875, -8.955078125, -8.27392578125, -7.5927734375, -6.91162109375, -6.23046875, -5.54931640625, -4.8681640625, -4.18701171875, -3.505859375, -2.82470703125, -2.1435546875, -1.46240234375, -0.78125, -0.10009765625, 0.5810546875, 1.26220703125, 1.943359375, 2.62451171875, 3.3056640625, 3.98681640625, 4.66796875, 5.34912109375, 6.0302734375, 6.71142578125, 7.392578125, 8.07373046875, 8.7548828125, 9.43603515625, 10.1171875, 10.79833984375, 11.4794921875, 12.16064453125, 12.841796875, 13.52294921875, 14.2041015625, 14.88525390625, 15.56640625, 16.24755859375, 16.9287109375, 17.60986328125, 18.291015625, 18.97216796875, 19.6533203125, 20.33447265625, 21.015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 10.0, 14.0, 11.0, 14.0, 4.0, 8.0, 21.0, 32.0, 22.0, 31.0, 34.0, 37.0, 38.0, 50.0, 42.0, 44.0, 45.0, 43.0, 38.0, 40.0, 46.0, 39.0, 38.0, 46.0, 32.0, 34.0, 29.0, 25.0, 30.0, 18.0, 12.0, 19.0, 10.0, 7.0, 10.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8515625, -15.2686767578125, -14.685791015625, -14.1029052734375, -13.52001953125, -12.9371337890625, -12.354248046875, -11.7713623046875, -11.1884765625, -10.6055908203125, -10.022705078125, -9.4398193359375, -8.85693359375, -8.2740478515625, -7.691162109375, -7.1082763671875, -6.525390625, -5.9425048828125, -5.359619140625, -4.7767333984375, -4.19384765625, -3.6109619140625, -3.028076171875, -2.4451904296875, -1.8623046875, -1.2794189453125, -0.696533203125, -0.1136474609375, 0.46923828125, 1.0521240234375, 1.635009765625, 2.2178955078125, 2.80078125, 3.3836669921875, 3.966552734375, 4.5494384765625, 5.13232421875, 5.7152099609375, 6.298095703125, 6.8809814453125, 7.4638671875, 8.0467529296875, 8.629638671875, 9.2125244140625, 9.79541015625, 10.3782958984375, 10.961181640625, 11.5440673828125, 12.126953125, 12.7098388671875, 13.292724609375, 13.8756103515625, 14.45849609375, 15.0413818359375, 15.624267578125, 16.2071533203125, 16.7900390625, 17.3729248046875, 17.955810546875, 18.5386962890625, 19.12158203125, 19.7044677734375, 20.287353515625, 20.8702392578125, 21.453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 6.0, 9.0, 13.0, 25.0, 33.0, 55.0, 61.0, 100.0, 135.0, 215.0, 317.0, 535.0, 819.0, 1344.0, 2178.0, 3625.0, 6552.0, 11710.0, 21766.0, 40267.0, 73989.0, 126542.0, 183744.0, 198741.0, 157376.0, 97568.0, 54566.0, 29636.0, 15965.0, 8490.0, 4685.0, 2838.0, 1650.0, 1036.0, 675.0, 439.0, 256.0, 193.0, 117.0, 93.0, 56.0, 38.0, 30.0, 20.0, 9.0, 10.0, 10.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-32.09375, -31.12841796875, -30.1630859375, -29.19775390625, -28.232421875, -27.26708984375, -26.3017578125, -25.33642578125, -24.37109375, -23.40576171875, -22.4404296875, -21.47509765625, -20.509765625, -19.54443359375, -18.5791015625, -17.61376953125, -16.6484375, -15.68310546875, -14.7177734375, -13.75244140625, -12.787109375, -11.82177734375, -10.8564453125, -9.89111328125, -8.92578125, -7.96044921875, -6.9951171875, -6.02978515625, -5.064453125, -4.09912109375, -3.1337890625, -2.16845703125, -1.203125, -0.23779296875, 0.7275390625, 1.69287109375, 2.658203125, 3.62353515625, 4.5888671875, 5.55419921875, 6.51953125, 7.48486328125, 8.4501953125, 9.41552734375, 10.380859375, 11.34619140625, 12.3115234375, 13.27685546875, 14.2421875, 15.20751953125, 16.1728515625, 17.13818359375, 18.103515625, 19.06884765625, 20.0341796875, 20.99951171875, 21.96484375, 22.93017578125, 23.8955078125, 24.86083984375, 25.826171875, 26.79150390625, 27.7568359375, 28.72216796875, 29.6875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 10.0, 6.0, 6.0, 10.0, 14.0, 18.0, 20.0, 21.0, 31.0, 26.0, 33.0, 22.0, 27.0, 30.0, 33.0, 44.0, 35.0, 48.0, 44.0, 35.0, 43.0, 39.0, 26.0, 39.0, 42.0, 42.0, 32.0, 27.0, 25.0, 24.0, 26.0, 14.0, 17.0, 24.0, 11.0, 10.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.0859375, -10.746337890625, -10.40673828125, -10.067138671875, -9.7275390625, -9.387939453125, -9.04833984375, -8.708740234375, -8.369140625, -8.029541015625, -7.68994140625, -7.350341796875, -7.0107421875, -6.671142578125, -6.33154296875, -5.991943359375, -5.65234375, -5.312744140625, -4.97314453125, -4.633544921875, -4.2939453125, -3.954345703125, -3.61474609375, -3.275146484375, -2.935546875, -2.595947265625, -2.25634765625, -1.916748046875, -1.5771484375, -1.237548828125, -0.89794921875, -0.558349609375, -0.21875, 0.120849609375, 0.46044921875, 0.800048828125, 1.1396484375, 1.479248046875, 1.81884765625, 2.158447265625, 2.498046875, 2.837646484375, 3.17724609375, 3.516845703125, 3.8564453125, 4.196044921875, 4.53564453125, 4.875244140625, 5.21484375, 5.554443359375, 5.89404296875, 6.233642578125, 6.5732421875, 6.912841796875, 7.25244140625, 7.592041015625, 7.931640625, 8.271240234375, 8.61083984375, 8.950439453125, 9.2900390625, 9.629638671875, 9.96923828125, 10.308837890625, 10.6484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 3.0, 9.0, 12.0, 29.0, 29.0, 37.0, 66.0, 99.0, 116.0, 191.0, 267.0, 390.0, 628.0, 1010.0, 1638.0, 2523.0, 4262.0, 7166.0, 12778.0, 22758.0, 42077.0, 75862.0, 126356.0, 178760.0, 192373.0, 152870.0, 98686.0, 55954.0, 31003.0, 16797.0, 9639.0, 5445.0, 3205.0, 1977.0, 1224.0, 825.0, 526.0, 301.0, 223.0, 122.0, 94.0, 81.0, 49.0, 25.0, 25.0, 13.0, 13.0, 5.0, 7.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-6.53515625, -6.33245849609375, -6.1297607421875, -5.92706298828125, -5.724365234375, -5.52166748046875, -5.3189697265625, -5.11627197265625, -4.91357421875, -4.71087646484375, -4.5081787109375, -4.30548095703125, -4.102783203125, -3.90008544921875, -3.6973876953125, -3.49468994140625, -3.2919921875, -3.08929443359375, -2.8865966796875, -2.68389892578125, -2.481201171875, -2.27850341796875, -2.0758056640625, -1.87310791015625, -1.67041015625, -1.46771240234375, -1.2650146484375, -1.06231689453125, -0.859619140625, -0.65692138671875, -0.4542236328125, -0.25152587890625, -0.048828125, 0.15386962890625, 0.3565673828125, 0.55926513671875, 0.761962890625, 0.96466064453125, 1.1673583984375, 1.37005615234375, 1.57275390625, 1.77545166015625, 1.9781494140625, 2.18084716796875, 2.383544921875, 2.58624267578125, 2.7889404296875, 2.99163818359375, 3.1943359375, 3.39703369140625, 3.5997314453125, 3.80242919921875, 4.005126953125, 4.20782470703125, 4.4105224609375, 4.61322021484375, 4.81591796875, 5.01861572265625, 5.2213134765625, 5.42401123046875, 5.626708984375, 5.82940673828125, 6.0321044921875, 6.23480224609375, 6.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 9.0, 10.0, 11.0, 16.0, 21.0, 30.0, 39.0, 47.0, 60.0, 50.0, 61.0, 81.0, 77.0, 75.0, 55.0, 67.0, 45.0, 44.0, 51.0, 32.0, 18.0, 26.0, 11.0, 14.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007205009460449219, -0.000696226954460144, -0.0006719529628753662, -0.0006476789712905884, -0.0006234049797058105, -0.0005991309881210327, -0.0005748569965362549, -0.000550583004951477, -0.0005263090133666992, -0.0005020350217819214, -0.00047776103019714355, -0.0004534870386123657, -0.0004292130470275879, -0.00040493905544281006, -0.0003806650638580322, -0.0003563910722732544, -0.00033211708068847656, -0.00030784308910369873, -0.0002835690975189209, -0.00025929510593414307, -0.00023502111434936523, -0.0002107471227645874, -0.00018647313117980957, -0.00016219913959503174, -0.0001379251480102539, -0.00011365115642547607, -8.937716484069824e-05, -6.510317325592041e-05, -4.082918167114258e-05, -1.6555190086364746e-05, 7.718801498413086e-06, 3.199279308319092e-05, 5.626678466796875e-05, 8.054077625274658e-05, 0.00010481476783752441, 0.00012908875942230225, 0.00015336275100708008, 0.0001776367425918579, 0.00020191073417663574, 0.00022618472576141357, 0.0002504587173461914, 0.00027473270893096924, 0.00029900670051574707, 0.0003232806921005249, 0.00034755468368530273, 0.00037182867527008057, 0.0003961026668548584, 0.00042037665843963623, 0.00044465065002441406, 0.0004689246416091919, 0.0004931986331939697, 0.0005174726247787476, 0.0005417466163635254, 0.0005660206079483032, 0.0005902945995330811, 0.0006145685911178589, 0.0006388425827026367, 0.0006631165742874146, 0.0006873905658721924, 0.0007116645574569702, 0.000735938549041748, 0.0007602125406265259, 0.0007844865322113037, 0.0008087605237960815, 0.0008330345153808594]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 5.0, 20.0, 22.0, 26.0, 43.0, 71.0, 86.0, 95.0, 178.0, 261.0, 355.0, 510.0, 776.0, 1164.0, 1675.0, 2551.0, 3835.0, 5856.0, 9429.0, 15566.0, 25439.0, 41646.0, 66027.0, 99386.0, 134725.0, 155030.0, 147164.0, 116670.0, 81918.0, 52284.0, 32255.0, 20000.0, 11980.0, 7501.0, 4703.0, 3029.0, 2009.0, 1376.0, 936.0, 629.0, 431.0, 286.0, 181.0, 128.0, 93.0, 75.0, 46.0, 29.0, 17.0, 12.0, 4.0, 10.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0], "bins": [-5.28125, -5.1148681640625, -4.948486328125, -4.7821044921875, -4.61572265625, -4.4493408203125, -4.282958984375, -4.1165771484375, -3.9501953125, -3.7838134765625, -3.617431640625, -3.4510498046875, -3.28466796875, -3.1182861328125, -2.951904296875, -2.7855224609375, -2.619140625, -2.4527587890625, -2.286376953125, -2.1199951171875, -1.95361328125, -1.7872314453125, -1.620849609375, -1.4544677734375, -1.2880859375, -1.1217041015625, -0.955322265625, -0.7889404296875, -0.62255859375, -0.4561767578125, -0.289794921875, -0.1234130859375, 0.04296875, 0.2093505859375, 0.375732421875, 0.5421142578125, 0.70849609375, 0.8748779296875, 1.041259765625, 1.2076416015625, 1.3740234375, 1.5404052734375, 1.706787109375, 1.8731689453125, 2.03955078125, 2.2059326171875, 2.372314453125, 2.5386962890625, 2.705078125, 2.8714599609375, 3.037841796875, 3.2042236328125, 3.37060546875, 3.5369873046875, 3.703369140625, 3.8697509765625, 4.0361328125, 4.2025146484375, 4.368896484375, 4.5352783203125, 4.70166015625, 4.8680419921875, 5.034423828125, 5.2008056640625, 5.3671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 2.0, 6.0, 6.0, 6.0, 10.0, 9.0, 17.0, 23.0, 21.0, 36.0, 25.0, 33.0, 37.0, 33.0, 42.0, 57.0, 44.0, 48.0, 39.0, 48.0, 62.0, 37.0, 37.0, 50.0, 40.0, 31.0, 32.0, 33.0, 28.0, 19.0, 17.0, 14.0, 10.0, 7.0, 13.0, 4.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.25390625, -2.192779541015625, -2.13165283203125, -2.070526123046875, -2.0093994140625, -1.948272705078125, -1.88714599609375, -1.826019287109375, -1.764892578125, -1.703765869140625, -1.64263916015625, -1.581512451171875, -1.5203857421875, -1.459259033203125, -1.39813232421875, -1.337005615234375, -1.27587890625, -1.214752197265625, -1.15362548828125, -1.092498779296875, -1.0313720703125, -0.970245361328125, -0.90911865234375, -0.847991943359375, -0.786865234375, -0.725738525390625, -0.66461181640625, -0.603485107421875, -0.5423583984375, -0.481231689453125, -0.42010498046875, -0.358978271484375, -0.2978515625, -0.236724853515625, -0.17559814453125, -0.114471435546875, -0.0533447265625, 0.007781982421875, 0.06890869140625, 0.130035400390625, 0.191162109375, 0.252288818359375, 0.31341552734375, 0.374542236328125, 0.4356689453125, 0.496795654296875, 0.55792236328125, 0.619049072265625, 0.68017578125, 0.741302490234375, 0.80242919921875, 0.863555908203125, 0.9246826171875, 0.985809326171875, 1.04693603515625, 1.108062744140625, 1.169189453125, 1.230316162109375, 1.29144287109375, 1.352569580078125, 1.4136962890625, 1.474822998046875, 1.53594970703125, 1.597076416015625, 1.658203125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 3.0, 9.0, 8.0, 14.0, 14.0, 26.0, 34.0, 38.0, 37.0, 29.0, 45.0, 41.0, 55.0, 70.0, 65.0, 61.0, 49.0, 50.0, 43.0, 48.0, 47.0, 35.0, 25.0, 18.0, 25.0, 19.0, 19.0, 15.0, 18.0, 9.0, 4.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.121753692626953, -19.388927459716797, -18.65610122680664, -17.923274993896484, -17.190446853637695, -16.45762062072754, -15.724794387817383, -14.991968154907227, -14.25914192199707, -13.526315689086914, -12.793488502502441, -12.060662269592285, -11.327836036682129, -10.595008850097656, -9.8621826171875, -9.129356384277344, -8.396529197692871, -7.663702487945557, -6.9308762550354, -6.198049545288086, -5.46522331237793, -4.732396602630615, -3.999569892883301, -3.2667436599731445, -2.53391695022583, -1.8010904788970947, -1.0682638883590698, -0.3354372978210449, 0.39738917350769043, 1.1302156448364258, 1.8630423545837402, 2.5958685874938965, 3.328695297241211, 4.061522006988525, 4.794348239898682, 5.527174949645996, 6.260001182556152, 6.992827892303467, 7.725654602050781, 8.458480834960938, 9.191307067871094, 9.92413330078125, 10.656960487365723, 11.389786720275879, 12.122612953186035, 12.855440139770508, 13.588266372680664, 14.32109260559082, 15.053919792175293, 15.78674602508545, 16.519573211669922, 17.252399444580078, 17.985225677490234, 18.71805191040039, 19.450878143310547, 20.183704376220703, 20.916532516479492, 21.64935874938965, 22.382184982299805, 23.115013122558594, 23.84783935546875, 24.580665588378906, 25.313491821289062, 26.04631805419922, 26.779144287109375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 10.0, 11.0, 14.0, 14.0, 17.0, 19.0, 20.0, 27.0, 41.0, 34.0, 36.0, 45.0, 40.0, 44.0, 41.0, 37.0, 48.0, 40.0, 40.0, 36.0, 39.0, 41.0, 34.0, 24.0, 36.0, 25.0, 29.0, 22.0, 21.0, 29.0, 12.0, 9.0, 9.0, 9.0, 11.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.59825897216797, -17.011245727539062, -16.424232482910156, -15.837221145629883, -15.250207901000977, -14.66319465637207, -14.07618236541748, -13.48917007446289, -12.902156829833984, -12.315143585205078, -11.728131294250488, -11.141119003295898, -10.554105758666992, -9.967092514038086, -9.380080223083496, -8.793067932128906, -8.2060546875, -7.619041919708252, -7.032029151916504, -6.445016384124756, -5.858003616333008, -5.27099084854126, -4.683978080749512, -4.096965312957764, -3.5099525451660156, -2.9229397773742676, -2.3359270095825195, -1.7489142417907715, -1.1619014739990234, -0.5748887062072754, 0.012124061584472656, 0.5991368293762207, 1.1861495971679688, 1.7731623649597168, 2.360175132751465, 2.947187900543213, 3.534200668334961, 4.121213436126709, 4.708226203918457, 5.295238971710205, 5.882251739501953, 6.469264507293701, 7.056277275085449, 7.643290042877197, 8.230302810668945, 8.817316055297852, 9.404328346252441, 9.991340637207031, 10.578353881835938, 11.165367126464844, 11.752379417419434, 12.339391708374023, 12.92640495300293, 13.513418197631836, 14.100430488586426, 14.687442779541016, 15.274456024169922, 15.861469268798828, 16.448482513427734, 17.035493850708008, 17.622507095336914, 18.20952033996582, 18.796531677246094, 19.383544921875, 19.970558166503906]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 5.0, 14.0, 13.0, 24.0, 39.0, 66.0, 87.0, 136.0, 211.0, 329.0, 468.0, 707.0, 953.0, 1549.0, 2345.0, 3784.0, 5881.0, 9411.0, 15064.0, 24340.0, 40179.0, 66922.0, 111205.0, 186913.0, 307437.0, 471069.0, 625294.0, 675780.0, 580351.0, 410254.0, 258314.0, 156021.0, 93356.0, 55705.0, 33671.0, 20796.0, 12798.0, 8066.0, 5061.0, 3339.0, 2168.0, 1431.0, 920.0, 602.0, 413.0, 267.0, 183.0, 109.0, 83.0, 46.0, 39.0, 24.0, 18.0, 13.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-17.8125, -17.243896484375, -16.67529296875, -16.106689453125, -15.5380859375, -14.969482421875, -14.40087890625, -13.832275390625, -13.263671875, -12.695068359375, -12.12646484375, -11.557861328125, -10.9892578125, -10.420654296875, -9.85205078125, -9.283447265625, -8.71484375, -8.146240234375, -7.57763671875, -7.009033203125, -6.4404296875, -5.871826171875, -5.30322265625, -4.734619140625, -4.166015625, -3.597412109375, -3.02880859375, -2.460205078125, -1.8916015625, -1.322998046875, -0.75439453125, -0.185791015625, 0.3828125, 0.951416015625, 1.52001953125, 2.088623046875, 2.6572265625, 3.225830078125, 3.79443359375, 4.363037109375, 4.931640625, 5.500244140625, 6.06884765625, 6.637451171875, 7.2060546875, 7.774658203125, 8.34326171875, 8.911865234375, 9.48046875, 10.049072265625, 10.61767578125, 11.186279296875, 11.7548828125, 12.323486328125, 12.89208984375, 13.460693359375, 14.029296875, 14.597900390625, 15.16650390625, 15.735107421875, 16.3037109375, 16.872314453125, 17.44091796875, 18.009521484375, 18.578125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 6.0, 9.0, 16.0, 9.0, 18.0, 16.0, 19.0, 26.0, 30.0, 30.0, 40.0, 31.0, 28.0, 37.0, 43.0, 55.0, 36.0, 39.0, 43.0, 36.0, 40.0, 34.0, 36.0, 28.0, 31.0, 34.0, 32.0, 25.0, 20.0, 22.0, 26.0, 19.0, 19.0, 7.0, 10.0, 9.0, 6.0, 6.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.5078125, -13.0443115234375, -12.580810546875, -12.1173095703125, -11.65380859375, -11.1903076171875, -10.726806640625, -10.2633056640625, -9.7998046875, -9.3363037109375, -8.872802734375, -8.4093017578125, -7.94580078125, -7.4822998046875, -7.018798828125, -6.5552978515625, -6.091796875, -5.6282958984375, -5.164794921875, -4.7012939453125, -4.23779296875, -3.7742919921875, -3.310791015625, -2.8472900390625, -2.3837890625, -1.9202880859375, -1.456787109375, -0.9932861328125, -0.52978515625, -0.0662841796875, 0.397216796875, 0.8607177734375, 1.32421875, 1.7877197265625, 2.251220703125, 2.7147216796875, 3.17822265625, 3.6417236328125, 4.105224609375, 4.5687255859375, 5.0322265625, 5.4957275390625, 5.959228515625, 6.4227294921875, 6.88623046875, 7.3497314453125, 7.813232421875, 8.2767333984375, 8.740234375, 9.2037353515625, 9.667236328125, 10.1307373046875, 10.59423828125, 11.0577392578125, 11.521240234375, 11.9847412109375, 12.4482421875, 12.9117431640625, 13.375244140625, 13.8387451171875, 14.30224609375, 14.7657470703125, 15.229248046875, 15.6927490234375, 16.15625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 12.0, 13.0, 22.0, 38.0, 59.0, 99.0, 190.0, 290.0, 410.0, 659.0, 1058.0, 1718.0, 2839.0, 4502.0, 7384.0, 11832.0, 19624.0, 32114.0, 52969.0, 85688.0, 138441.0, 217581.0, 327406.0, 457169.0, 564245.0, 591419.0, 525101.0, 400423.0, 277134.0, 179803.0, 113693.0, 69792.0, 42917.0, 26202.0, 16114.0, 9735.0, 6007.0, 3634.0, 2191.0, 1367.0, 867.0, 545.0, 380.0, 218.0, 153.0, 81.0, 57.0, 37.0, 21.0, 17.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140625, -16.5927734375, -16.044921875, -15.4970703125, -14.94921875, -14.4013671875, -13.853515625, -13.3056640625, -12.7578125, -12.2099609375, -11.662109375, -11.1142578125, -10.56640625, -10.0185546875, -9.470703125, -8.9228515625, -8.375, -7.8271484375, -7.279296875, -6.7314453125, -6.18359375, -5.6357421875, -5.087890625, -4.5400390625, -3.9921875, -3.4443359375, -2.896484375, -2.3486328125, -1.80078125, -1.2529296875, -0.705078125, -0.1572265625, 0.390625, 0.9384765625, 1.486328125, 2.0341796875, 2.58203125, 3.1298828125, 3.677734375, 4.2255859375, 4.7734375, 5.3212890625, 5.869140625, 6.4169921875, 6.96484375, 7.5126953125, 8.060546875, 8.6083984375, 9.15625, 9.7041015625, 10.251953125, 10.7998046875, 11.34765625, 11.8955078125, 12.443359375, 12.9912109375, 13.5390625, 14.0869140625, 14.634765625, 15.1826171875, 15.73046875, 16.2783203125, 16.826171875, 17.3740234375, 17.921875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 7.0, 8.0, 10.0, 15.0, 20.0, 36.0, 40.0, 45.0, 46.0, 82.0, 81.0, 99.0, 129.0, 153.0, 180.0, 186.0, 207.0, 245.0, 235.0, 250.0, 231.0, 213.0, 227.0, 212.0, 200.0, 163.0, 164.0, 118.0, 93.0, 85.0, 60.0, 49.0, 29.0, 39.0, 27.0, 19.0, 20.0, 12.0, 10.0, 5.0, 6.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.05029296875, -6.7958984375, -6.54150390625, -6.287109375, -6.03271484375, -5.7783203125, -5.52392578125, -5.26953125, -5.01513671875, -4.7607421875, -4.50634765625, -4.251953125, -3.99755859375, -3.7431640625, -3.48876953125, -3.234375, -2.97998046875, -2.7255859375, -2.47119140625, -2.216796875, -1.96240234375, -1.7080078125, -1.45361328125, -1.19921875, -0.94482421875, -0.6904296875, -0.43603515625, -0.181640625, 0.07275390625, 0.3271484375, 0.58154296875, 0.8359375, 1.09033203125, 1.3447265625, 1.59912109375, 1.853515625, 2.10791015625, 2.3623046875, 2.61669921875, 2.87109375, 3.12548828125, 3.3798828125, 3.63427734375, 3.888671875, 4.14306640625, 4.3974609375, 4.65185546875, 4.90625, 5.16064453125, 5.4150390625, 5.66943359375, 5.923828125, 6.17822265625, 6.4326171875, 6.68701171875, 6.94140625, 7.19580078125, 7.4501953125, 7.70458984375, 7.958984375, 8.21337890625, 8.4677734375, 8.72216796875, 8.9765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 2.0, 4.0, 4.0, 11.0, 15.0, 11.0, 13.0, 22.0, 18.0, 26.0, 45.0, 25.0, 34.0, 45.0, 43.0, 37.0, 53.0, 46.0, 43.0, 36.0, 42.0, 51.0, 33.0, 36.0, 34.0, 35.0, 32.0, 27.0, 34.0, 24.0, 17.0, 21.0, 12.0, 12.0, 12.0, 10.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-20.966812133789062, -20.371826171875, -19.776840209960938, -19.181856155395508, -18.586870193481445, -17.991884231567383, -17.39689826965332, -16.801912307739258, -16.206928253173828, -15.611942291259766, -15.01695728302002, -14.421971321105957, -13.826986312866211, -13.232000350952148, -12.637014389038086, -12.042028427124023, -11.447042465209961, -10.852056503295898, -10.257071495056152, -9.66208553314209, -9.067100524902344, -8.472114562988281, -7.877128601074219, -7.2821431159973145, -6.68715763092041, -6.092172145843506, -5.497186660766602, -4.902200698852539, -4.307215213775635, -3.7122297286987305, -3.117244005203247, -2.5222582817077637, -1.9272747039794922, -1.3322890996932983, -0.7373034954071045, -0.14231789112091064, 0.4526677131652832, 1.0476531982421875, 1.642638921737671, 2.2376246452331543, 2.8326101303100586, 3.427595615386963, 4.022581100463867, 4.61756706237793, 5.212552547454834, 5.807538032531738, 6.402523994445801, 6.997509479522705, 7.592494964599609, 8.187480926513672, 8.782465934753418, 9.37745189666748, 9.972436904907227, 10.567422866821289, 11.162408828735352, 11.757394790649414, 12.35237979888916, 12.947365760803223, 13.542350769042969, 14.137336730957031, 14.732322692871094, 15.32730770111084, 15.922293663024902, 16.51727867126465, 17.11226463317871]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 9.0, 8.0, 5.0, 6.0, 14.0, 12.0, 14.0, 12.0, 17.0, 23.0, 18.0, 26.0, 29.0, 44.0, 25.0, 37.0, 39.0, 40.0, 40.0, 29.0, 45.0, 49.0, 43.0, 41.0, 34.0, 43.0, 28.0, 33.0, 33.0, 35.0, 23.0, 18.0, 21.0, 9.0, 21.0, 19.0, 12.0, 9.0, 8.0, 6.0, 5.0, 5.0, 8.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.620214462280273, -16.067855834960938, -15.515498161315918, -14.963139533996582, -14.410780906677246, -13.858423233032227, -13.30606460571289, -12.753705978393555, -12.201347351074219, -11.648988723754883, -11.096631050109863, -10.544272422790527, -9.991913795471191, -9.439556121826172, -8.887197494506836, -8.3348388671875, -7.7824811935424805, -7.230123043060303, -6.677764415740967, -6.125406265258789, -5.573047637939453, -5.020689487457275, -4.468331336975098, -3.915972948074341, -3.363614559173584, -2.811256170272827, -2.2588977813720703, -1.7065396308898926, -1.1541812419891357, -0.6018228530883789, -0.04946470260620117, 0.5028936862945557, 1.0552520751953125, 1.6076104640960693, 2.159968852996826, 2.712327003479004, 3.2646853923797607, 3.8170437812805176, 4.369401931762695, 4.921760559082031, 5.474118709564209, 6.026476860046387, 6.578835487365723, 7.1311936378479, 7.683551788330078, 8.235910415649414, 8.78826904296875, 9.34062671661377, 9.892985343933105, 10.445343971252441, 10.997701644897461, 11.550060272216797, 12.102418899536133, 12.654777526855469, 13.207135200500488, 13.759493827819824, 14.311851501464844, 14.86421012878418, 15.4165678024292, 15.968926429748535, 16.521284103393555, 17.07364273071289, 17.626001358032227, 18.178359985351562, 18.7307186126709]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 16.0, 27.0, 41.0, 54.0, 78.0, 104.0, 165.0, 297.0, 410.0, 525.0, 854.0, 1247.0, 1853.0, 2706.0, 4025.0, 5658.0, 8446.0, 12080.0, 17289.0, 24337.0, 33711.0, 45289.0, 59062.0, 73442.0, 87252.0, 96743.0, 100745.0, 97113.0, 87187.0, 73312.0, 58111.0, 44812.0, 32761.0, 23868.0, 17001.0, 11806.0, 8188.0, 5631.0, 3917.0, 2709.0, 1821.0, 1261.0, 853.0, 580.0, 388.0, 251.0, 186.0, 125.0, 86.0, 48.0, 26.0, 24.0, 10.0, 12.0, 9.0, 4.0, 1.0, 1.0], "bins": [-7.19921875, -6.9775390625, -6.755859375, -6.5341796875, -6.3125, -6.0908203125, -5.869140625, -5.6474609375, -5.42578125, -5.2041015625, -4.982421875, -4.7607421875, -4.5390625, -4.3173828125, -4.095703125, -3.8740234375, -3.65234375, -3.4306640625, -3.208984375, -2.9873046875, -2.765625, -2.5439453125, -2.322265625, -2.1005859375, -1.87890625, -1.6572265625, -1.435546875, -1.2138671875, -0.9921875, -0.7705078125, -0.548828125, -0.3271484375, -0.10546875, 0.1162109375, 0.337890625, 0.5595703125, 0.78125, 1.0029296875, 1.224609375, 1.4462890625, 1.66796875, 1.8896484375, 2.111328125, 2.3330078125, 2.5546875, 2.7763671875, 2.998046875, 3.2197265625, 3.44140625, 3.6630859375, 3.884765625, 4.1064453125, 4.328125, 4.5498046875, 4.771484375, 4.9931640625, 5.21484375, 5.4365234375, 5.658203125, 5.8798828125, 6.1015625, 6.3232421875, 6.544921875, 6.7666015625, 6.98828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 8.0, 6.0, 6.0, 11.0, 11.0, 17.0, 11.0, 17.0, 21.0, 17.0, 28.0, 22.0, 40.0, 31.0, 33.0, 44.0, 35.0, 43.0, 30.0, 37.0, 57.0, 40.0, 38.0, 42.0, 35.0, 31.0, 33.0, 34.0, 33.0, 28.0, 24.0, 13.0, 18.0, 17.0, 18.0, 12.0, 16.0, 4.0, 5.0, 7.0, 4.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.0625, -16.50537109375, -15.9482421875, -15.39111328125, -14.833984375, -14.27685546875, -13.7197265625, -13.16259765625, -12.60546875, -12.04833984375, -11.4912109375, -10.93408203125, -10.376953125, -9.81982421875, -9.2626953125, -8.70556640625, -8.1484375, -7.59130859375, -7.0341796875, -6.47705078125, -5.919921875, -5.36279296875, -4.8056640625, -4.24853515625, -3.69140625, -3.13427734375, -2.5771484375, -2.02001953125, -1.462890625, -0.90576171875, -0.3486328125, 0.20849609375, 0.765625, 1.32275390625, 1.8798828125, 2.43701171875, 2.994140625, 3.55126953125, 4.1083984375, 4.66552734375, 5.22265625, 5.77978515625, 6.3369140625, 6.89404296875, 7.451171875, 8.00830078125, 8.5654296875, 9.12255859375, 9.6796875, 10.23681640625, 10.7939453125, 11.35107421875, 11.908203125, 12.46533203125, 13.0224609375, 13.57958984375, 14.13671875, 14.69384765625, 15.2509765625, 15.80810546875, 16.365234375, 16.92236328125, 17.4794921875, 18.03662109375, 18.59375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 12.0, 18.0, 34.0, 57.0, 57.0, 93.0, 131.0, 188.0, 325.0, 488.0, 696.0, 1217.0, 1737.0, 2838.0, 4424.0, 6767.0, 10574.0, 16867.0, 27315.0, 124076.0, 740112.0, 47849.0, 22855.0, 14246.0, 8893.0, 5933.0, 3764.0, 2378.0, 1567.0, 1017.0, 688.0, 458.0, 315.0, 192.0, 121.0, 74.0, 54.0, 36.0, 23.0, 12.0, 11.0, 6.0, 12.0, 4.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.703125, -16.169921875, -15.63671875, -15.103515625, -14.5703125, -14.037109375, -13.50390625, -12.970703125, -12.4375, -11.904296875, -11.37109375, -10.837890625, -10.3046875, -9.771484375, -9.23828125, -8.705078125, -8.171875, -7.638671875, -7.10546875, -6.572265625, -6.0390625, -5.505859375, -4.97265625, -4.439453125, -3.90625, -3.373046875, -2.83984375, -2.306640625, -1.7734375, -1.240234375, -0.70703125, -0.173828125, 0.359375, 0.892578125, 1.42578125, 1.958984375, 2.4921875, 3.025390625, 3.55859375, 4.091796875, 4.625, 5.158203125, 5.69140625, 6.224609375, 6.7578125, 7.291015625, 7.82421875, 8.357421875, 8.890625, 9.423828125, 9.95703125, 10.490234375, 11.0234375, 11.556640625, 12.08984375, 12.623046875, 13.15625, 13.689453125, 14.22265625, 14.755859375, 15.2890625, 15.822265625, 16.35546875, 16.888671875, 17.421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 10.0, 14.0, 6.0, 16.0, 22.0, 28.0, 25.0, 13.0, 31.0, 30.0, 29.0, 32.0, 43.0, 41.0, 49.0, 32.0, 45.0, 36.0, 44.0, 39.0, 33.0, 46.0, 33.0, 35.0, 30.0, 30.0, 29.0, 31.0, 19.0, 18.0, 21.0, 17.0, 13.0, 8.0, 7.0, 11.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.359375, -14.915283203125, -14.47119140625, -14.027099609375, -13.5830078125, -13.138916015625, -12.69482421875, -12.250732421875, -11.806640625, -11.362548828125, -10.91845703125, -10.474365234375, -10.0302734375, -9.586181640625, -9.14208984375, -8.697998046875, -8.25390625, -7.809814453125, -7.36572265625, -6.921630859375, -6.4775390625, -6.033447265625, -5.58935546875, -5.145263671875, -4.701171875, -4.257080078125, -3.81298828125, -3.368896484375, -2.9248046875, -2.480712890625, -2.03662109375, -1.592529296875, -1.1484375, -0.704345703125, -0.26025390625, 0.183837890625, 0.6279296875, 1.072021484375, 1.51611328125, 1.960205078125, 2.404296875, 2.848388671875, 3.29248046875, 3.736572265625, 4.1806640625, 4.624755859375, 5.06884765625, 5.512939453125, 5.95703125, 6.401123046875, 6.84521484375, 7.289306640625, 7.7333984375, 8.177490234375, 8.62158203125, 9.065673828125, 9.509765625, 9.953857421875, 10.39794921875, 10.842041015625, 11.2861328125, 11.730224609375, 12.17431640625, 12.618408203125, 13.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 14.0, 12.0, 30.0, 23.0, 44.0, 59.0, 69.0, 115.0, 125.0, 226.0, 345.0, 552.0, 1013.0, 1862.0, 3799.0, 8366.0, 22332.0, 118281.0, 830430.0, 37139.0, 12661.0, 5166.0, 2515.0, 1330.0, 755.0, 426.0, 279.0, 165.0, 114.0, 90.0, 42.0, 44.0, 33.0, 30.0, 18.0, 9.0, 3.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.65234375, -2.5748291015625, -2.497314453125, -2.4197998046875, -2.34228515625, -2.2647705078125, -2.187255859375, -2.1097412109375, -2.0322265625, -1.9547119140625, -1.877197265625, -1.7996826171875, -1.72216796875, -1.6446533203125, -1.567138671875, -1.4896240234375, -1.412109375, -1.3345947265625, -1.257080078125, -1.1795654296875, -1.10205078125, -1.0245361328125, -0.947021484375, -0.8695068359375, -0.7919921875, -0.7144775390625, -0.636962890625, -0.5594482421875, -0.48193359375, -0.4044189453125, -0.326904296875, -0.2493896484375, -0.171875, -0.0943603515625, -0.016845703125, 0.0606689453125, 0.13818359375, 0.2156982421875, 0.293212890625, 0.3707275390625, 0.4482421875, 0.5257568359375, 0.603271484375, 0.6807861328125, 0.75830078125, 0.8358154296875, 0.913330078125, 0.9908447265625, 1.068359375, 1.1458740234375, 1.223388671875, 1.3009033203125, 1.37841796875, 1.4559326171875, 1.533447265625, 1.6109619140625, 1.6884765625, 1.7659912109375, 1.843505859375, 1.9210205078125, 1.99853515625, 2.0760498046875, 2.153564453125, 2.2310791015625, 2.30859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 8.0, 13.0, 21.0, 15.0, 30.0, 49.0, 49.0, 56.0, 67.0, 67.0, 96.0, 89.0, 83.0, 70.0, 58.0, 48.0, 39.0, 25.0, 26.0, 12.0, 17.0, 13.0, 5.0, 6.0, 5.0, 6.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004284381866455078, -0.0004131905734539032, -0.0003979429602622986, -0.00038269534707069397, -0.00036744773387908936, -0.00035220012068748474, -0.0003369525074958801, -0.0003217048943042755, -0.0003064572811126709, -0.0002912096679210663, -0.00027596205472946167, -0.00026071444153785706, -0.00024546682834625244, -0.00023021921515464783, -0.0002149716019630432, -0.0001997239887714386, -0.00018447637557983398, -0.00016922876238822937, -0.00015398114919662476, -0.00013873353600502014, -0.00012348592281341553, -0.00010823830962181091, -9.29906964302063e-05, -7.774308323860168e-05, -6.249547004699707e-05, -4.7247856855392456e-05, -3.200024366378784e-05, -1.6752630472183228e-05, -1.5050172805786133e-06, 1.3742595911026001e-05, 2.8990209102630615e-05, 4.423782229423523e-05, 5.9485435485839844e-05, 7.473304867744446e-05, 8.998066186904907e-05, 0.00010522827506065369, 0.0001204758882522583, 0.00013572350144386292, 0.00015097111463546753, 0.00016621872782707214, 0.00018146634101867676, 0.00019671395421028137, 0.00021196156740188599, 0.0002272091805934906, 0.00024245679378509521, 0.00025770440697669983, 0.00027295202016830444, 0.00028819963335990906, 0.00030344724655151367, 0.0003186948597431183, 0.0003339424729347229, 0.0003491900861263275, 0.00036443769931793213, 0.00037968531250953674, 0.00039493292570114136, 0.00041018053889274597, 0.0004254281520843506, 0.0004406757652759552, 0.0004559233784675598, 0.00047117099165916443, 0.00048641860485076904, 0.0005016662180423737, 0.0005169138312339783, 0.0005321614444255829, 0.0005474090576171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 9.0, 10.0, 18.0, 32.0, 43.0, 62.0, 105.0, 136.0, 155.0, 243.0, 351.0, 576.0, 792.0, 1177.0, 1659.0, 2634.0, 3858.0, 5856.0, 8971.0, 14303.0, 22343.0, 34799.0, 54731.0, 83291.0, 118150.0, 149864.0, 153423.0, 127781.0, 92414.0, 61098.0, 39265.0, 24878.0, 15834.0, 10121.0, 6421.0, 4251.0, 2833.0, 1869.0, 1279.0, 887.0, 634.0, 426.0, 297.0, 235.0, 124.0, 103.0, 64.0, 51.0, 27.0, 22.0, 23.0, 5.0, 11.0, 7.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.73876953125, -0.7157745361328125, -0.692779541015625, -0.6697845458984375, -0.64678955078125, -0.6237945556640625, -0.600799560546875, -0.5778045654296875, -0.5548095703125, -0.5318145751953125, -0.508819580078125, -0.4858245849609375, -0.46282958984375, -0.4398345947265625, -0.416839599609375, -0.3938446044921875, -0.370849609375, -0.3478546142578125, -0.324859619140625, -0.3018646240234375, -0.27886962890625, -0.2558746337890625, -0.232879638671875, -0.2098846435546875, -0.1868896484375, -0.1638946533203125, -0.140899658203125, -0.1179046630859375, -0.09490966796875, -0.0719146728515625, -0.048919677734375, -0.0259246826171875, -0.0029296875, 0.0200653076171875, 0.043060302734375, 0.0660552978515625, 0.08905029296875, 0.1120452880859375, 0.135040283203125, 0.1580352783203125, 0.1810302734375, 0.2040252685546875, 0.227020263671875, 0.2500152587890625, 0.27301025390625, 0.2960052490234375, 0.319000244140625, 0.3419952392578125, 0.364990234375, 0.3879852294921875, 0.410980224609375, 0.4339752197265625, 0.45697021484375, 0.4799652099609375, 0.502960205078125, 0.5259552001953125, 0.5489501953125, 0.5719451904296875, 0.594940185546875, 0.6179351806640625, 0.64093017578125, 0.6639251708984375, 0.686920166015625, 0.7099151611328125, 0.73291015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 4.0, 5.0, 8.0, 10.0, 11.0, 13.0, 12.0, 20.0, 25.0, 28.0, 34.0, 39.0, 49.0, 67.0, 58.0, 67.0, 50.0, 67.0, 63.0, 55.0, 45.0, 52.0, 31.0, 35.0, 39.0, 21.0, 17.0, 23.0, 6.0, 10.0, 6.0, 5.0, 4.0, 5.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33203125, -0.3212547302246094, -0.31047821044921875, -0.2997016906738281, -0.2889251708984375, -0.2781486511230469, -0.26737213134765625, -0.2565956115722656, -0.245819091796875, -0.23504257202148438, -0.22426605224609375, -0.21348953247070312, -0.2027130126953125, -0.19193649291992188, -0.18115997314453125, -0.17038345336914062, -0.15960693359375, -0.14883041381835938, -0.13805389404296875, -0.12727737426757812, -0.1165008544921875, -0.10572433471679688, -0.09494781494140625, -0.08417129516601562, -0.073394775390625, -0.06261825561523438, -0.05184173583984375, -0.041065216064453125, -0.0302886962890625, -0.019512176513671875, -0.00873565673828125, 0.002040863037109375, 0.0128173828125, 0.023593902587890625, 0.03437042236328125, 0.045146942138671875, 0.0559234619140625, 0.06669998168945312, 0.07747650146484375, 0.08825302124023438, 0.099029541015625, 0.10980606079101562, 0.12058258056640625, 0.13135910034179688, 0.1421356201171875, 0.15291213989257812, 0.16368865966796875, 0.17446517944335938, 0.18524169921875, 0.19601821899414062, 0.20679473876953125, 0.21757125854492188, 0.2283477783203125, 0.23912429809570312, 0.24990081787109375, 0.2606773376464844, 0.271453857421875, 0.2822303771972656, 0.29300689697265625, 0.3037834167480469, 0.3145599365234375, 0.3253364562988281, 0.33611297607421875, 0.3468894958496094, 0.357666015625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 6.0, 17.0, 21.0, 20.0, 7.0, 25.0, 27.0, 31.0, 39.0, 42.0, 55.0, 49.0, 39.0, 45.0, 49.0, 56.0, 47.0, 40.0, 43.0, 38.0, 45.0, 25.0, 28.0, 31.0, 28.0, 22.0, 23.0, 25.0, 19.0, 8.0, 5.0, 11.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8658390045166, -19.23126220703125, -18.5966854095459, -17.962108612060547, -17.327531814575195, -16.692955017089844, -16.058378219604492, -15.42380142211914, -14.789224624633789, -14.154647827148438, -13.520071029663086, -12.885494232177734, -12.250917434692383, -11.616340637207031, -10.98176383972168, -10.347187042236328, -9.712610244750977, -9.078033447265625, -8.443456649780273, -7.808879852294922, -7.17430305480957, -6.539726257324219, -5.905149459838867, -5.270572662353516, -4.635995864868164, -4.0014190673828125, -3.366842269897461, -2.7322654724121094, -2.097688674926758, -1.4631118774414062, -0.8285350799560547, -0.19395828247070312, 0.44061851501464844, 1.0751953125, 1.7097721099853516, 2.344348907470703, 2.9789257049560547, 3.6135025024414062, 4.248079299926758, 4.882656097412109, 5.517232894897461, 6.1518096923828125, 6.786386489868164, 7.420963287353516, 8.055540084838867, 8.690116882324219, 9.32469367980957, 9.959270477294922, 10.593847274780273, 11.228424072265625, 11.863000869750977, 12.497577667236328, 13.13215446472168, 13.766731262207031, 14.401308059692383, 15.035884857177734, 15.670461654663086, 16.305038452148438, 16.93961524963379, 17.57419204711914, 18.208768844604492, 18.843345642089844, 19.477922439575195, 20.112499237060547, 20.7470760345459]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 10.0, 7.0, 5.0, 13.0, 19.0, 9.0, 15.0, 20.0, 16.0, 27.0, 26.0, 39.0, 30.0, 31.0, 39.0, 43.0, 33.0, 43.0, 34.0, 48.0, 43.0, 48.0, 39.0, 37.0, 28.0, 39.0, 31.0, 35.0, 28.0, 24.0, 18.0, 18.0, 11.0, 22.0, 12.0, 12.0, 10.0, 3.0, 7.0, 5.0, 9.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.38070297241211, -16.81770133972168, -16.25469970703125, -15.69169807434082, -15.12869644165039, -14.565694808959961, -14.002692222595215, -13.439690589904785, -12.876688957214355, -12.313687324523926, -11.750685691833496, -11.187684059143066, -10.62468147277832, -10.06167984008789, -9.498678207397461, -8.935676574707031, -8.372674942016602, -7.809673309326172, -7.246671676635742, -6.683669567108154, -6.120667934417725, -5.557666301727295, -4.994664192199707, -4.431662559509277, -3.8686609268188477, -3.305659294128418, -2.742657423019409, -2.1796555519104004, -1.6166539192199707, -1.053652286529541, -0.4906504154205322, 0.07235145568847656, 0.6353511810302734, 1.1983529329299927, 1.761354684829712, 2.3243565559387207, 2.8873581886291504, 3.45035982131958, 4.013361930847168, 4.576363563537598, 5.139365196228027, 5.702366828918457, 6.265368461608887, 6.828370571136475, 7.391372203826904, 7.954373836517334, 8.517375946044922, 9.080377578735352, 9.643379211425781, 10.206380844116211, 10.76938247680664, 11.33238410949707, 11.8953857421875, 12.45838737487793, 13.021389961242676, 13.584391593933105, 14.147393226623535, 14.710394859313965, 15.273396492004395, 15.836398124694824, 16.39940071105957, 16.96240234375, 17.52540397644043, 18.08840560913086, 18.65140724182129]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 22.0, 23.0, 26.0, 43.0, 73.0, 98.0, 168.0, 246.0, 361.0, 605.0, 879.0, 1472.0, 2254.0, 3742.0, 5787.0, 9419.0, 14824.0, 23262.0, 36112.0, 54032.0, 77219.0, 102599.0, 123586.0, 131778.0, 124522.0, 103128.0, 77307.0, 54633.0, 36254.0, 23459.0, 14975.0, 9599.0, 5901.0, 3662.0, 2353.0, 1466.0, 926.0, 625.0, 404.0, 249.0, 156.0, 115.0, 62.0, 47.0, 34.0, 15.0, 10.0, 8.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.171875, -15.641845703125, -15.11181640625, -14.581787109375, -14.0517578125, -13.521728515625, -12.99169921875, -12.461669921875, -11.931640625, -11.401611328125, -10.87158203125, -10.341552734375, -9.8115234375, -9.281494140625, -8.75146484375, -8.221435546875, -7.69140625, -7.161376953125, -6.63134765625, -6.101318359375, -5.5712890625, -5.041259765625, -4.51123046875, -3.981201171875, -3.451171875, -2.921142578125, -2.39111328125, -1.861083984375, -1.3310546875, -0.801025390625, -0.27099609375, 0.259033203125, 0.7890625, 1.319091796875, 1.84912109375, 2.379150390625, 2.9091796875, 3.439208984375, 3.96923828125, 4.499267578125, 5.029296875, 5.559326171875, 6.08935546875, 6.619384765625, 7.1494140625, 7.679443359375, 8.20947265625, 8.739501953125, 9.26953125, 9.799560546875, 10.32958984375, 10.859619140625, 11.3896484375, 11.919677734375, 12.44970703125, 12.979736328125, 13.509765625, 14.039794921875, 14.56982421875, 15.099853515625, 15.6298828125, 16.159912109375, 16.68994140625, 17.219970703125, 17.75]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 6.0, 7.0, 6.0, 10.0, 8.0, 13.0, 14.0, 16.0, 14.0, 21.0, 23.0, 25.0, 30.0, 42.0, 26.0, 31.0, 44.0, 43.0, 28.0, 39.0, 39.0, 55.0, 38.0, 41.0, 39.0, 41.0, 26.0, 40.0, 27.0, 41.0, 20.0, 18.0, 17.0, 21.0, 13.0, 22.0, 8.0, 9.0, 8.0, 7.0, 6.0, 6.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8984375, -15.3746337890625, -14.850830078125, -14.3270263671875, -13.80322265625, -13.2794189453125, -12.755615234375, -12.2318115234375, -11.7080078125, -11.1842041015625, -10.660400390625, -10.1365966796875, -9.61279296875, -9.0889892578125, -8.565185546875, -8.0413818359375, -7.517578125, -6.9937744140625, -6.469970703125, -5.9461669921875, -5.42236328125, -4.8985595703125, -4.374755859375, -3.8509521484375, -3.3271484375, -2.8033447265625, -2.279541015625, -1.7557373046875, -1.23193359375, -0.7081298828125, -0.184326171875, 0.3394775390625, 0.86328125, 1.3870849609375, 1.910888671875, 2.4346923828125, 2.95849609375, 3.4822998046875, 4.006103515625, 4.5299072265625, 5.0537109375, 5.5775146484375, 6.101318359375, 6.6251220703125, 7.14892578125, 7.6727294921875, 8.196533203125, 8.7203369140625, 9.244140625, 9.7679443359375, 10.291748046875, 10.8155517578125, 11.33935546875, 11.8631591796875, 12.386962890625, 12.9107666015625, 13.4345703125, 13.9583740234375, 14.482177734375, 15.0059814453125, 15.52978515625, 16.0535888671875, 16.577392578125, 17.1011962890625, 17.625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 8.0, 10.0, 19.0, 24.0, 46.0, 62.0, 113.0, 189.0, 283.0, 558.0, 1022.0, 1963.0, 3854.0, 8040.0, 16992.0, 35176.0, 69575.0, 126594.0, 187884.0, 210151.0, 170258.0, 105794.0, 56199.0, 27660.0, 13198.0, 6326.0, 3076.0, 1536.0, 842.0, 443.0, 275.0, 141.0, 85.0, 56.0, 38.0, 18.0, 15.0, 12.0, 7.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.5625, -27.67919921875, -26.7958984375, -25.91259765625, -25.029296875, -24.14599609375, -23.2626953125, -22.37939453125, -21.49609375, -20.61279296875, -19.7294921875, -18.84619140625, -17.962890625, -17.07958984375, -16.1962890625, -15.31298828125, -14.4296875, -13.54638671875, -12.6630859375, -11.77978515625, -10.896484375, -10.01318359375, -9.1298828125, -8.24658203125, -7.36328125, -6.47998046875, -5.5966796875, -4.71337890625, -3.830078125, -2.94677734375, -2.0634765625, -1.18017578125, -0.296875, 0.58642578125, 1.4697265625, 2.35302734375, 3.236328125, 4.11962890625, 5.0029296875, 5.88623046875, 6.76953125, 7.65283203125, 8.5361328125, 9.41943359375, 10.302734375, 11.18603515625, 12.0693359375, 12.95263671875, 13.8359375, 14.71923828125, 15.6025390625, 16.48583984375, 17.369140625, 18.25244140625, 19.1357421875, 20.01904296875, 20.90234375, 21.78564453125, 22.6689453125, 23.55224609375, 24.435546875, 25.31884765625, 26.2021484375, 27.08544921875, 27.96875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 9.0, 8.0, 8.0, 12.0, 15.0, 20.0, 16.0, 20.0, 16.0, 23.0, 23.0, 27.0, 33.0, 31.0, 29.0, 40.0, 39.0, 35.0, 37.0, 38.0, 50.0, 41.0, 33.0, 38.0, 31.0, 35.0, 29.0, 25.0, 32.0, 30.0, 27.0, 20.0, 24.0, 13.0, 15.0, 10.0, 11.0, 9.0, 3.0, 6.0, 12.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.5628662109375, -9.235107421875, -8.9073486328125, -8.57958984375, -8.2518310546875, -7.924072265625, -7.5963134765625, -7.2685546875, -6.9407958984375, -6.613037109375, -6.2852783203125, -5.95751953125, -5.6297607421875, -5.302001953125, -4.9742431640625, -4.646484375, -4.3187255859375, -3.990966796875, -3.6632080078125, -3.33544921875, -3.0076904296875, -2.679931640625, -2.3521728515625, -2.0244140625, -1.6966552734375, -1.368896484375, -1.0411376953125, -0.71337890625, -0.3856201171875, -0.057861328125, 0.2698974609375, 0.59765625, 0.9254150390625, 1.253173828125, 1.5809326171875, 1.90869140625, 2.2364501953125, 2.564208984375, 2.8919677734375, 3.2197265625, 3.5474853515625, 3.875244140625, 4.2030029296875, 4.53076171875, 4.8585205078125, 5.186279296875, 5.5140380859375, 5.841796875, 6.1695556640625, 6.497314453125, 6.8250732421875, 7.15283203125, 7.4805908203125, 7.808349609375, 8.1361083984375, 8.4638671875, 8.7916259765625, 9.119384765625, 9.4471435546875, 9.77490234375, 10.1026611328125, 10.430419921875, 10.7581787109375, 11.0859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 10.0, 9.0, 13.0, 13.0, 16.0, 20.0, 40.0, 75.0, 112.0, 165.0, 256.0, 446.0, 792.0, 1262.0, 2249.0, 3983.0, 7117.0, 13012.0, 23992.0, 44021.0, 77194.0, 128244.0, 177545.0, 190259.0, 152779.0, 98127.0, 56820.0, 31203.0, 17002.0, 9372.0, 5266.0, 2920.0, 1709.0, 1065.0, 545.0, 350.0, 205.0, 133.0, 72.0, 43.0, 40.0, 30.0, 14.0, 9.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.75, -6.52667236328125, -6.3033447265625, -6.08001708984375, -5.856689453125, -5.63336181640625, -5.4100341796875, -5.18670654296875, -4.96337890625, -4.74005126953125, -4.5167236328125, -4.29339599609375, -4.070068359375, -3.84674072265625, -3.6234130859375, -3.40008544921875, -3.1767578125, -2.95343017578125, -2.7301025390625, -2.50677490234375, -2.283447265625, -2.06011962890625, -1.8367919921875, -1.61346435546875, -1.39013671875, -1.16680908203125, -0.9434814453125, -0.72015380859375, -0.496826171875, -0.27349853515625, -0.0501708984375, 0.17315673828125, 0.396484375, 0.61981201171875, 0.8431396484375, 1.06646728515625, 1.289794921875, 1.51312255859375, 1.7364501953125, 1.95977783203125, 2.18310546875, 2.40643310546875, 2.6297607421875, 2.85308837890625, 3.076416015625, 3.29974365234375, 3.5230712890625, 3.74639892578125, 3.9697265625, 4.19305419921875, 4.4163818359375, 4.63970947265625, 4.863037109375, 5.08636474609375, 5.3096923828125, 5.53302001953125, 5.75634765625, 5.97967529296875, 6.2030029296875, 6.42633056640625, 6.649658203125, 6.87298583984375, 7.0963134765625, 7.31964111328125, 7.54296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 13.0, 10.0, 10.0, 16.0, 14.0, 12.0, 21.0, 31.0, 30.0, 27.0, 43.0, 50.0, 57.0, 47.0, 65.0, 55.0, 61.0, 53.0, 50.0, 53.0, 47.0, 42.0, 38.0, 43.0, 19.0, 19.0, 22.0, 8.0, 13.0, 4.0, 5.0, 8.0, 2.0, 2.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006818771362304688, -0.0006601959466934204, -0.0006385147571563721, -0.0006168335676193237, -0.0005951523780822754, -0.000573471188545227, -0.0005517899990081787, -0.0005301088094711304, -0.000508427619934082, -0.0004867464303970337, -0.00046506524085998535, -0.000443384051322937, -0.00042170286178588867, -0.00040002167224884033, -0.000378340482711792, -0.00035665929317474365, -0.0003349781036376953, -0.00031329691410064697, -0.00029161572456359863, -0.0002699345350265503, -0.00024825334548950195, -0.0002265721559524536, -0.00020489096641540527, -0.00018320977687835693, -0.0001615285873413086, -0.00013984739780426025, -0.00011816620826721191, -9.648501873016357e-05, -7.480382919311523e-05, -5.3122639656066895e-05, -3.1441450119018555e-05, -9.760260581970215e-06, 1.1920928955078125e-05, 3.3602118492126465e-05, 5.5283308029174805e-05, 7.696449756622314e-05, 9.864568710327148e-05, 0.00012032687664031982, 0.00014200806617736816, 0.0001636892557144165, 0.00018537044525146484, 0.00020705163478851318, 0.00022873282432556152, 0.00025041401386260986, 0.0002720952033996582, 0.00029377639293670654, 0.0003154575824737549, 0.0003371387720108032, 0.00035881996154785156, 0.0003805011510848999, 0.00040218234062194824, 0.0004238635301589966, 0.0004455447196960449, 0.00046722590923309326, 0.0004889070987701416, 0.0005105882883071899, 0.0005322694778442383, 0.0005539506673812866, 0.000575631856918335, 0.0005973130464553833, 0.0006189942359924316, 0.00064067542552948, 0.0006623566150665283, 0.0006840378046035767, 0.000705718994140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 6.0, 7.0, 3.0, 21.0, 22.0, 26.0, 40.0, 62.0, 91.0, 152.0, 222.0, 356.0, 531.0, 904.0, 1526.0, 2624.0, 4707.0, 8441.0, 14890.0, 27291.0, 48287.0, 83246.0, 131362.0, 174683.0, 181170.0, 144838.0, 94676.0, 56228.0, 31616.0, 17460.0, 9899.0, 5490.0, 3168.0, 1763.0, 1021.0, 601.0, 421.0, 218.0, 159.0, 96.0, 68.0, 47.0, 46.0, 24.0, 11.0, 8.0, 5.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.1171875, -6.89569091796875, -6.6741943359375, -6.45269775390625, -6.231201171875, -6.00970458984375, -5.7882080078125, -5.56671142578125, -5.34521484375, -5.12371826171875, -4.9022216796875, -4.68072509765625, -4.459228515625, -4.23773193359375, -4.0162353515625, -3.79473876953125, -3.5732421875, -3.35174560546875, -3.1302490234375, -2.90875244140625, -2.687255859375, -2.46575927734375, -2.2442626953125, -2.02276611328125, -1.80126953125, -1.57977294921875, -1.3582763671875, -1.13677978515625, -0.915283203125, -0.69378662109375, -0.4722900390625, -0.25079345703125, -0.029296875, 0.19219970703125, 0.4136962890625, 0.63519287109375, 0.856689453125, 1.07818603515625, 1.2996826171875, 1.52117919921875, 1.74267578125, 1.96417236328125, 2.1856689453125, 2.40716552734375, 2.628662109375, 2.85015869140625, 3.0716552734375, 3.29315185546875, 3.5146484375, 3.73614501953125, 3.9576416015625, 4.17913818359375, 4.400634765625, 4.62213134765625, 4.8436279296875, 5.06512451171875, 5.28662109375, 5.50811767578125, 5.7296142578125, 5.95111083984375, 6.172607421875, 6.39410400390625, 6.6156005859375, 6.83709716796875, 7.05859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 15.0, 7.0, 11.0, 16.0, 15.0, 18.0, 31.0, 36.0, 43.0, 35.0, 45.0, 45.0, 51.0, 44.0, 57.0, 52.0, 52.0, 45.0, 51.0, 44.0, 45.0, 49.0, 28.0, 36.0, 23.0, 20.0, 16.0, 17.0, 15.0, 11.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.169921875, -2.091461181640625, -2.01300048828125, -1.934539794921875, -1.8560791015625, -1.777618408203125, -1.69915771484375, -1.620697021484375, -1.542236328125, -1.463775634765625, -1.38531494140625, -1.306854248046875, -1.2283935546875, -1.149932861328125, -1.07147216796875, -0.993011474609375, -0.91455078125, -0.836090087890625, -0.75762939453125, -0.679168701171875, -0.6007080078125, -0.522247314453125, -0.44378662109375, -0.365325927734375, -0.286865234375, -0.208404541015625, -0.12994384765625, -0.051483154296875, 0.0269775390625, 0.105438232421875, 0.18389892578125, 0.262359619140625, 0.3408203125, 0.419281005859375, 0.49774169921875, 0.576202392578125, 0.6546630859375, 0.733123779296875, 0.81158447265625, 0.890045166015625, 0.968505859375, 1.046966552734375, 1.12542724609375, 1.203887939453125, 1.2823486328125, 1.360809326171875, 1.43927001953125, 1.517730712890625, 1.59619140625, 1.674652099609375, 1.75311279296875, 1.831573486328125, 1.9100341796875, 1.988494873046875, 2.06695556640625, 2.145416259765625, 2.223876953125, 2.302337646484375, 2.38079833984375, 2.459259033203125, 2.5377197265625, 2.616180419921875, 2.69464111328125, 2.773101806640625, 2.8515625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 10.0, 6.0, 11.0, 11.0, 23.0, 11.0, 19.0, 22.0, 23.0, 35.0, 21.0, 40.0, 43.0, 38.0, 43.0, 50.0, 36.0, 39.0, 48.0, 40.0, 42.0, 29.0, 49.0, 42.0, 31.0, 30.0, 30.0, 25.0, 20.0, 19.0, 17.0, 12.0, 19.0, 11.0, 8.0, 8.0, 5.0, 7.0, 8.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.005413055419922, -17.463844299316406, -16.922273635864258, -16.380704879760742, -15.839134216308594, -15.297565460205078, -14.755995750427246, -14.214426040649414, -13.672856330871582, -13.13128662109375, -12.589716911315918, -12.048147201538086, -11.50657844543457, -10.965007781982422, -10.423439025878906, -9.881869316101074, -9.340299606323242, -8.79872989654541, -8.257160186767578, -7.715590953826904, -7.174021244049072, -6.63245153427124, -6.090882301330566, -5.549312591552734, -5.007742881774902, -4.46617317199707, -3.9246037006378174, -3.3830342292785645, -2.8414645195007324, -2.2998948097229004, -1.7583253383636475, -1.2167558670043945, -0.6751880645751953, -0.13361847400665283, 0.40795111656188965, 0.9495207071304321, 1.4910902976989746, 2.0326600074768066, 2.5742294788360596, 3.1157989501953125, 3.6573686599731445, 4.198938369750977, 4.740508079528809, 5.282077312469482, 5.8236470222473145, 6.3652167320251465, 6.90678596496582, 7.448355674743652, 7.989925384521484, 8.531495094299316, 9.073064804077148, 9.61463451385498, 10.156204223632812, 10.697772979736328, 11.23934268951416, 11.780912399291992, 12.322482109069824, 12.864051818847656, 13.405621528625488, 13.94719123840332, 14.488759994506836, 15.030330657958984, 15.5718994140625, 16.113468170166016, 16.655038833618164]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 9.0, 6.0, 7.0, 9.0, 15.0, 21.0, 19.0, 17.0, 24.0, 26.0, 27.0, 35.0, 37.0, 23.0, 27.0, 41.0, 33.0, 31.0, 39.0, 39.0, 41.0, 40.0, 50.0, 27.0, 37.0, 33.0, 27.0, 32.0, 18.0, 22.0, 16.0, 23.0, 16.0, 17.0, 13.0, 17.0, 12.0, 13.0, 6.0, 12.0, 7.0, 12.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-14.920804023742676, -14.411434173583984, -13.90206527709961, -13.392695426940918, -12.883325576782227, -12.373955726623535, -11.864585876464844, -11.355216979980469, -10.845847129821777, -10.336477279663086, -9.827108383178711, -9.31773853302002, -8.808368682861328, -8.298998832702637, -7.7896294593811035, -7.28026008605957, -6.770890235900879, -6.2615203857421875, -5.752151012420654, -5.242781639099121, -4.73341178894043, -4.224041938781738, -3.714672565460205, -3.2053029537200928, -2.6959333419799805, -2.186563730239868, -1.6771941184997559, -1.1678245067596436, -0.6584548950195312, -0.14908528327941895, 0.36028432846069336, 0.8696539402008057, 1.3790245056152344, 1.8883941173553467, 2.397763729095459, 2.9071333408355713, 3.4165029525756836, 3.925872564315796, 4.435242176055908, 4.944611549377441, 5.453981399536133, 5.963351249694824, 6.472720623016357, 6.982089996337891, 7.491459846496582, 8.000829696655273, 8.510198593139648, 9.01956844329834, 9.528938293457031, 10.038308143615723, 10.547677993774414, 11.057046890258789, 11.56641674041748, 12.075786590576172, 12.585155487060547, 13.094525337219238, 13.60389518737793, 14.113265037536621, 14.622634887695312, 15.132003784179688, 15.641373634338379, 16.15074348449707, 16.660112380981445, 17.169483184814453, 17.678852081298828]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 10.0, 7.0, 5.0, 7.0, 15.0, 22.0, 44.0, 73.0, 110.0, 158.0, 230.0, 360.0, 603.0, 913.0, 1465.0, 2242.0, 3742.0, 6271.0, 10273.0, 17562.0, 29545.0, 50735.0, 87725.0, 153359.0, 263578.0, 426571.0, 603873.0, 696353.0, 637667.0, 471372.0, 299881.0, 177249.0, 103211.0, 59399.0, 35051.0, 21294.0, 12886.0, 7750.0, 4683.0, 2914.0, 1809.0, 1193.0, 710.0, 462.0, 325.0, 201.0, 153.0, 64.0, 65.0, 42.0, 28.0, 11.0, 10.0, 8.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-17.28125, -16.735107421875, -16.18896484375, -15.642822265625, -15.0966796875, -14.550537109375, -14.00439453125, -13.458251953125, -12.912109375, -12.365966796875, -11.81982421875, -11.273681640625, -10.7275390625, -10.181396484375, -9.63525390625, -9.089111328125, -8.54296875, -7.996826171875, -7.45068359375, -6.904541015625, -6.3583984375, -5.812255859375, -5.26611328125, -4.719970703125, -4.173828125, -3.627685546875, -3.08154296875, -2.535400390625, -1.9892578125, -1.443115234375, -0.89697265625, -0.350830078125, 0.1953125, 0.741455078125, 1.28759765625, 1.833740234375, 2.3798828125, 2.926025390625, 3.47216796875, 4.018310546875, 4.564453125, 5.110595703125, 5.65673828125, 6.202880859375, 6.7490234375, 7.295166015625, 7.84130859375, 8.387451171875, 8.93359375, 9.479736328125, 10.02587890625, 10.572021484375, 11.1181640625, 11.664306640625, 12.21044921875, 12.756591796875, 13.302734375, 13.848876953125, 14.39501953125, 14.941162109375, 15.4873046875, 16.033447265625, 16.57958984375, 17.125732421875, 17.671875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 9.0, 10.0, 9.0, 14.0, 17.0, 14.0, 13.0, 15.0, 32.0, 29.0, 23.0, 42.0, 29.0, 29.0, 31.0, 28.0, 46.0, 33.0, 31.0, 36.0, 47.0, 31.0, 41.0, 42.0, 44.0, 35.0, 30.0, 17.0, 15.0, 25.0, 20.0, 21.0, 14.0, 20.0, 16.0, 8.0, 11.0, 9.0, 11.0, 9.0, 5.0, 12.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.6796875, -12.23828125, -11.796875, -11.35546875, -10.9140625, -10.47265625, -10.03125, -9.58984375, -9.1484375, -8.70703125, -8.265625, -7.82421875, -7.3828125, -6.94140625, -6.5, -6.05859375, -5.6171875, -5.17578125, -4.734375, -4.29296875, -3.8515625, -3.41015625, -2.96875, -2.52734375, -2.0859375, -1.64453125, -1.203125, -0.76171875, -0.3203125, 0.12109375, 0.5625, 1.00390625, 1.4453125, 1.88671875, 2.328125, 2.76953125, 3.2109375, 3.65234375, 4.09375, 4.53515625, 4.9765625, 5.41796875, 5.859375, 6.30078125, 6.7421875, 7.18359375, 7.625, 8.06640625, 8.5078125, 8.94921875, 9.390625, 9.83203125, 10.2734375, 10.71484375, 11.15625, 11.59765625, 12.0390625, 12.48046875, 12.921875, 13.36328125, 13.8046875, 14.24609375, 14.6875, 15.12890625, 15.5703125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 9.0, 11.0, 14.0, 15.0, 22.0, 51.0, 58.0, 113.0, 153.0, 227.0, 323.0, 542.0, 827.0, 1268.0, 1941.0, 3007.0, 4864.0, 7737.0, 12335.0, 20034.0, 32154.0, 52591.0, 83989.0, 134496.0, 206552.0, 307356.0, 424979.0, 530151.0, 572486.0, 525792.0, 419889.0, 300969.0, 202355.0, 130744.0, 81755.0, 50657.0, 31570.0, 19672.0, 12043.0, 7593.0, 4696.0, 2970.0, 1873.0, 1198.0, 752.0, 492.0, 318.0, 222.0, 156.0, 94.0, 62.0, 41.0, 32.0, 15.0, 10.0, 9.0, 3.0, 3.0, 2.0, 6.0], "bins": [-16.375, -15.8707275390625, -15.366455078125, -14.8621826171875, -14.35791015625, -13.8536376953125, -13.349365234375, -12.8450927734375, -12.3408203125, -11.8365478515625, -11.332275390625, -10.8280029296875, -10.32373046875, -9.8194580078125, -9.315185546875, -8.8109130859375, -8.306640625, -7.8023681640625, -7.298095703125, -6.7938232421875, -6.28955078125, -5.7852783203125, -5.281005859375, -4.7767333984375, -4.2724609375, -3.7681884765625, -3.263916015625, -2.7596435546875, -2.25537109375, -1.7510986328125, -1.246826171875, -0.7425537109375, -0.23828125, 0.2659912109375, 0.770263671875, 1.2745361328125, 1.77880859375, 2.2830810546875, 2.787353515625, 3.2916259765625, 3.7958984375, 4.3001708984375, 4.804443359375, 5.3087158203125, 5.81298828125, 6.3172607421875, 6.821533203125, 7.3258056640625, 7.830078125, 8.3343505859375, 8.838623046875, 9.3428955078125, 9.84716796875, 10.3514404296875, 10.855712890625, 11.3599853515625, 11.8642578125, 12.3685302734375, 12.872802734375, 13.3770751953125, 13.88134765625, 14.3856201171875, 14.889892578125, 15.3941650390625, 15.8984375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 8.0, 15.0, 15.0, 17.0, 30.0, 24.0, 24.0, 41.0, 47.0, 57.0, 88.0, 104.0, 127.0, 141.0, 183.0, 171.0, 186.0, 219.0, 250.0, 228.0, 255.0, 204.0, 227.0, 198.0, 181.0, 193.0, 134.0, 126.0, 101.0, 86.0, 77.0, 67.0, 46.0, 49.0, 40.0, 20.0, 28.0, 16.0, 8.0, 12.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.43359375, -7.19549560546875, -6.9573974609375, -6.71929931640625, -6.481201171875, -6.24310302734375, -6.0050048828125, -5.76690673828125, -5.52880859375, -5.29071044921875, -5.0526123046875, -4.81451416015625, -4.576416015625, -4.33831787109375, -4.1002197265625, -3.86212158203125, -3.6240234375, -3.38592529296875, -3.1478271484375, -2.90972900390625, -2.671630859375, -2.43353271484375, -2.1954345703125, -1.95733642578125, -1.71923828125, -1.48114013671875, -1.2430419921875, -1.00494384765625, -0.766845703125, -0.52874755859375, -0.2906494140625, -0.05255126953125, 0.185546875, 0.42364501953125, 0.6617431640625, 0.89984130859375, 1.137939453125, 1.37603759765625, 1.6141357421875, 1.85223388671875, 2.09033203125, 2.32843017578125, 2.5665283203125, 2.80462646484375, 3.042724609375, 3.28082275390625, 3.5189208984375, 3.75701904296875, 3.9951171875, 4.23321533203125, 4.4713134765625, 4.70941162109375, 4.947509765625, 5.18560791015625, 5.4237060546875, 5.66180419921875, 5.89990234375, 6.13800048828125, 6.3760986328125, 6.61419677734375, 6.852294921875, 7.09039306640625, 7.3284912109375, 7.56658935546875, 7.8046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 6.0, 10.0, 13.0, 19.0, 17.0, 19.0, 20.0, 17.0, 27.0, 31.0, 28.0, 30.0, 45.0, 50.0, 34.0, 47.0, 53.0, 63.0, 43.0, 52.0, 53.0, 38.0, 34.0, 32.0, 31.0, 29.0, 26.0, 23.0, 18.0, 15.0, 14.0, 7.0, 13.0, 8.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.380870819091797, -17.808752059936523, -17.236631393432617, -16.664512634277344, -16.092391967773438, -15.520273208618164, -14.948153495788574, -14.376033782958984, -13.803914070129395, -13.231794357299805, -12.659674644470215, -12.087554931640625, -11.515436172485352, -10.943315505981445, -10.371196746826172, -9.799077033996582, -9.226957321166992, -8.654837608337402, -8.082717895507812, -7.510598659515381, -6.938478946685791, -6.366359233856201, -5.7942399978637695, -5.22212028503418, -4.65000057220459, -4.077880859375, -3.5057613849639893, -2.9336419105529785, -2.3615221977233887, -1.7894024848937988, -1.217283010482788, -0.6451635360717773, -0.0730438232421875, 0.4990757703781128, 1.071195363998413, 1.6433149576187134, 2.2154345512390137, 2.7875542640686035, 3.3596737384796143, 3.931793212890625, 4.503912925720215, 5.076032638549805, 5.6481523513793945, 6.220271587371826, 6.792391300201416, 7.364511013031006, 7.9366302490234375, 8.508749961853027, 9.080869674682617, 9.652989387512207, 10.225109100341797, 10.797228813171387, 11.369348526000977, 11.94146728515625, 12.51358699798584, 13.08570671081543, 13.65782642364502, 14.22994613647461, 14.8020658493042, 15.374185562133789, 15.946304321289062, 16.51842498779297, 17.090543746948242, 17.662662506103516, 18.234783172607422]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 6.0, 6.0, 4.0, 5.0, 6.0, 10.0, 10.0, 16.0, 14.0, 28.0, 19.0, 15.0, 27.0, 23.0, 24.0, 21.0, 27.0, 34.0, 32.0, 39.0, 36.0, 43.0, 46.0, 41.0, 27.0, 29.0, 42.0, 39.0, 34.0, 34.0, 30.0, 30.0, 21.0, 27.0, 23.0, 21.0, 21.0, 13.0, 15.0, 7.0, 7.0, 6.0, 4.0, 5.0, 4.0, 8.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-14.413839340209961, -13.925719261169434, -13.437599182128906, -12.949479103088379, -12.461359024047852, -11.97323989868164, -11.485118865966797, -10.996999740600586, -10.508879661560059, -10.020759582519531, -9.532639503479004, -9.044519424438477, -8.55639934539795, -8.068279266357422, -7.580159664154053, -7.092040061950684, -6.603919506072998, -6.115799427032471, -5.627679347991943, -5.139559745788574, -4.651439666748047, -4.1633195877075195, -3.675199508666992, -3.187079668045044, -2.6989595890045166, -2.2108395099639893, -1.722719669342041, -1.2345995903015137, -0.7464796304702759, -0.2583596706390381, 0.22976040840148926, 0.7178802490234375, 1.2060003280639648, 1.6941202878952026, 2.1822402477264404, 2.6703603267669678, 3.158480167388916, 3.6466002464294434, 4.134720325469971, 4.62283992767334, 5.110960006713867, 5.5990800857543945, 6.087200164794922, 6.575320243835449, 7.063439846038818, 7.551559925079346, 8.039680480957031, 8.527799606323242, 9.015920639038086, 9.504040718078613, 9.99216079711914, 10.480280876159668, 10.968400955200195, 11.456520080566406, 11.94464111328125, 12.432760238647461, 12.920880317687988, 13.409000396728516, 13.897120475769043, 14.38524055480957, 14.873360633850098, 15.361480712890625, 15.849599838256836, 16.33772087097168, 16.82583999633789]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 12.0, 14.0, 19.0, 37.0, 51.0, 93.0, 131.0, 190.0, 292.0, 438.0, 676.0, 1015.0, 1506.0, 2331.0, 3429.0, 5382.0, 7905.0, 11929.0, 17934.0, 25722.0, 36930.0, 51061.0, 68089.0, 85090.0, 100149.0, 108516.0, 108537.0, 99212.0, 83810.0, 66302.0, 49731.0, 35582.0, 24894.0, 17256.0, 11481.0, 7710.0, 5071.0, 3398.0, 2236.0, 1500.0, 1012.0, 663.0, 411.0, 285.0, 169.0, 124.0, 76.0, 55.0, 26.0, 32.0, 19.0, 9.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.93359375, -6.71661376953125, -6.4996337890625, -6.28265380859375, -6.065673828125, -5.84869384765625, -5.6317138671875, -5.41473388671875, -5.19775390625, -4.98077392578125, -4.7637939453125, -4.54681396484375, -4.329833984375, -4.11285400390625, -3.8958740234375, -3.67889404296875, -3.4619140625, -3.24493408203125, -3.0279541015625, -2.81097412109375, -2.593994140625, -2.37701416015625, -2.1600341796875, -1.94305419921875, -1.72607421875, -1.50909423828125, -1.2921142578125, -1.07513427734375, -0.858154296875, -0.64117431640625, -0.4241943359375, -0.20721435546875, 0.009765625, 0.22674560546875, 0.4437255859375, 0.66070556640625, 0.877685546875, 1.09466552734375, 1.3116455078125, 1.52862548828125, 1.74560546875, 1.96258544921875, 2.1795654296875, 2.39654541015625, 2.613525390625, 2.83050537109375, 3.0474853515625, 3.26446533203125, 3.4814453125, 3.69842529296875, 3.9154052734375, 4.13238525390625, 4.349365234375, 4.56634521484375, 4.7833251953125, 5.00030517578125, 5.21728515625, 5.43426513671875, 5.6512451171875, 5.86822509765625, 6.085205078125, 6.30218505859375, 6.5191650390625, 6.73614501953125, 6.953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 4.0, 6.0, 5.0, 5.0, 10.0, 11.0, 15.0, 15.0, 24.0, 22.0, 15.0, 23.0, 26.0, 24.0, 20.0, 29.0, 32.0, 32.0, 35.0, 39.0, 41.0, 43.0, 46.0, 28.0, 26.0, 45.0, 35.0, 34.0, 35.0, 32.0, 30.0, 21.0, 27.0, 24.0, 21.0, 20.0, 15.0, 14.0, 8.0, 8.0, 5.0, 5.0, 4.0, 6.0, 7.0, 10.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-14.5703125, -14.0789794921875, -13.587646484375, -13.0963134765625, -12.60498046875, -12.1136474609375, -11.622314453125, -11.1309814453125, -10.6396484375, -10.1483154296875, -9.656982421875, -9.1656494140625, -8.67431640625, -8.1829833984375, -7.691650390625, -7.2003173828125, -6.708984375, -6.2176513671875, -5.726318359375, -5.2349853515625, -4.74365234375, -4.2523193359375, -3.760986328125, -3.2696533203125, -2.7783203125, -2.2869873046875, -1.795654296875, -1.3043212890625, -0.81298828125, -0.3216552734375, 0.169677734375, 0.6610107421875, 1.15234375, 1.6436767578125, 2.135009765625, 2.6263427734375, 3.11767578125, 3.6090087890625, 4.100341796875, 4.5916748046875, 5.0830078125, 5.5743408203125, 6.065673828125, 6.5570068359375, 7.04833984375, 7.5396728515625, 8.031005859375, 8.5223388671875, 9.013671875, 9.5050048828125, 9.996337890625, 10.4876708984375, 10.97900390625, 11.4703369140625, 11.961669921875, 12.4530029296875, 12.9443359375, 13.4356689453125, 13.927001953125, 14.4183349609375, 14.90966796875, 15.4010009765625, 15.892333984375, 16.3836669921875, 16.875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 5.0, 6.0, 6.0, 15.0, 19.0, 28.0, 37.0, 55.0, 84.0, 149.0, 182.0, 295.0, 512.0, 738.0, 1161.0, 1925.0, 3137.0, 5111.0, 8028.0, 13216.0, 21714.0, 41371.0, 709461.0, 167854.0, 28525.0, 17253.0, 10554.0, 6395.0, 3977.0, 2469.0, 1553.0, 981.0, 583.0, 387.0, 259.0, 166.0, 118.0, 55.0, 49.0, 34.0, 36.0, 16.0, 9.0, 10.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-16.296875, -15.76708984375, -15.2373046875, -14.70751953125, -14.177734375, -13.64794921875, -13.1181640625, -12.58837890625, -12.05859375, -11.52880859375, -10.9990234375, -10.46923828125, -9.939453125, -9.40966796875, -8.8798828125, -8.35009765625, -7.8203125, -7.29052734375, -6.7607421875, -6.23095703125, -5.701171875, -5.17138671875, -4.6416015625, -4.11181640625, -3.58203125, -3.05224609375, -2.5224609375, -1.99267578125, -1.462890625, -0.93310546875, -0.4033203125, 0.12646484375, 0.65625, 1.18603515625, 1.7158203125, 2.24560546875, 2.775390625, 3.30517578125, 3.8349609375, 4.36474609375, 4.89453125, 5.42431640625, 5.9541015625, 6.48388671875, 7.013671875, 7.54345703125, 8.0732421875, 8.60302734375, 9.1328125, 9.66259765625, 10.1923828125, 10.72216796875, 11.251953125, 11.78173828125, 12.3115234375, 12.84130859375, 13.37109375, 13.90087890625, 14.4306640625, 14.96044921875, 15.490234375, 16.02001953125, 16.5498046875, 17.07958984375, 17.609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 12.0, 8.0, 8.0, 20.0, 19.0, 26.0, 23.0, 23.0, 30.0, 29.0, 29.0, 29.0, 32.0, 39.0, 38.0, 33.0, 41.0, 41.0, 40.0, 34.0, 46.0, 34.0, 37.0, 37.0, 41.0, 32.0, 27.0, 35.0, 10.0, 22.0, 26.0, 14.0, 18.0, 13.0, 12.0, 7.0, 8.0, 2.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.21875, -10.809814453125, -10.40087890625, -9.991943359375, -9.5830078125, -9.174072265625, -8.76513671875, -8.356201171875, -7.947265625, -7.538330078125, -7.12939453125, -6.720458984375, -6.3115234375, -5.902587890625, -5.49365234375, -5.084716796875, -4.67578125, -4.266845703125, -3.85791015625, -3.448974609375, -3.0400390625, -2.631103515625, -2.22216796875, -1.813232421875, -1.404296875, -0.995361328125, -0.58642578125, -0.177490234375, 0.2314453125, 0.640380859375, 1.04931640625, 1.458251953125, 1.8671875, 2.276123046875, 2.68505859375, 3.093994140625, 3.5029296875, 3.911865234375, 4.32080078125, 4.729736328125, 5.138671875, 5.547607421875, 5.95654296875, 6.365478515625, 6.7744140625, 7.183349609375, 7.59228515625, 8.001220703125, 8.41015625, 8.819091796875, 9.22802734375, 9.636962890625, 10.0458984375, 10.454833984375, 10.86376953125, 11.272705078125, 11.681640625, 12.090576171875, 12.49951171875, 12.908447265625, 13.3173828125, 13.726318359375, 14.13525390625, 14.544189453125, 14.953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 5.0, 7.0, 7.0, 12.0, 24.0, 21.0, 31.0, 36.0, 62.0, 84.0, 118.0, 154.0, 219.0, 317.0, 540.0, 780.0, 1229.0, 1794.0, 2904.0, 4473.0, 7174.0, 11871.0, 20167.0, 45018.0, 670295.0, 208534.0, 30411.0, 16172.0, 9579.0, 5824.0, 3727.0, 2334.0, 1566.0, 1000.0, 621.0, 466.0, 295.0, 191.0, 132.0, 100.0, 70.0, 48.0, 35.0, 28.0, 21.0, 17.0, 11.0, 10.0, 5.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8895797729492188, -0.8597259521484375, -0.8298721313476562, -0.800018310546875, -0.7701644897460938, -0.7403106689453125, -0.7104568481445312, -0.68060302734375, -0.6507492065429688, -0.6208953857421875, -0.5910415649414062, -0.561187744140625, -0.5313339233398438, -0.5014801025390625, -0.47162628173828125, -0.4417724609375, -0.41191864013671875, -0.3820648193359375, -0.35221099853515625, -0.322357177734375, -0.29250335693359375, -0.2626495361328125, -0.23279571533203125, -0.20294189453125, -0.17308807373046875, -0.1432342529296875, -0.11338043212890625, -0.083526611328125, -0.05367279052734375, -0.0238189697265625, 0.00603485107421875, 0.035888671875, 0.06574249267578125, 0.0955963134765625, 0.12545013427734375, 0.155303955078125, 0.18515777587890625, 0.2150115966796875, 0.24486541748046875, 0.27471923828125, 0.30457305908203125, 0.3344268798828125, 0.36428070068359375, 0.394134521484375, 0.42398834228515625, 0.4538421630859375, 0.48369598388671875, 0.5135498046875, 0.5434036254882812, 0.5732574462890625, 0.6031112670898438, 0.632965087890625, 0.6628189086914062, 0.6926727294921875, 0.7225265502929688, 0.75238037109375, 0.7822341918945312, 0.8120880126953125, 0.8419418334960938, 0.871795654296875, 0.9016494750976562, 0.9315032958984375, 0.9613571166992188, 0.9912109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 11.0, 11.0, 16.0, 23.0, 24.0, 23.0, 43.0, 46.0, 44.0, 63.0, 46.0, 54.0, 68.0, 72.0, 59.0, 55.0, 47.0, 39.0, 38.0, 38.0, 28.0, 25.0, 20.0, 17.0, 19.0, 9.0, 9.0, 12.0, 7.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0003559589385986328, -0.0003462545573711395, -0.00033655017614364624, -0.00032684579491615295, -0.00031714141368865967, -0.0003074370324611664, -0.0002977326512336731, -0.0002880282700061798, -0.0002783238887786865, -0.00026861950755119324, -0.00025891512632369995, -0.00024921074509620667, -0.00023950636386871338, -0.0002298019826412201, -0.0002200976014137268, -0.00021039322018623352, -0.00020068883895874023, -0.00019098445773124695, -0.00018128007650375366, -0.00017157569527626038, -0.0001618713140487671, -0.0001521669328212738, -0.00014246255159378052, -0.00013275817036628723, -0.00012305378913879395, -0.00011334940791130066, -0.00010364502668380737, -9.394064545631409e-05, -8.42362642288208e-05, -7.453188300132751e-05, -6.482750177383423e-05, -5.512312054634094e-05, -4.5418739318847656e-05, -3.571435809135437e-05, -2.6009976863861084e-05, -1.6305595636367798e-05, -6.601214408874512e-06, 3.1031668186187744e-06, 1.280754804611206e-05, 2.2511929273605347e-05, 3.221631050109863e-05, 4.192069172859192e-05, 5.1625072956085205e-05, 6.132945418357849e-05, 7.103383541107178e-05, 8.073821663856506e-05, 9.044259786605835e-05, 0.00010014697909355164, 0.00010985136032104492, 0.00011955574154853821, 0.0001292601227760315, 0.00013896450400352478, 0.00014866888523101807, 0.00015837326645851135, 0.00016807764768600464, 0.00017778202891349792, 0.0001874864101409912, 0.0001971907913684845, 0.00020689517259597778, 0.00021659955382347107, 0.00022630393505096436, 0.00023600831627845764, 0.00024571269750595093, 0.0002554170787334442, 0.0002651214599609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 11.0, 7.0, 12.0, 25.0, 40.0, 69.0, 118.0, 161.0, 275.0, 432.0, 703.0, 1046.0, 1674.0, 2966.0, 4974.0, 8902.0, 16386.0, 29424.0, 52093.0, 86048.0, 125679.0, 159835.0, 166256.0, 140869.0, 100919.0, 64614.0, 37627.0, 20693.0, 11281.0, 6350.0, 3590.0, 2052.0, 1288.0, 797.0, 489.0, 308.0, 191.0, 128.0, 89.0, 53.0, 27.0, 19.0, 12.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6536483764648438, -0.6320037841796875, -0.6103591918945312, -0.588714599609375, -0.5670700073242188, -0.5454254150390625, -0.5237808227539062, -0.50213623046875, -0.48049163818359375, -0.4588470458984375, -0.43720245361328125, -0.415557861328125, -0.39391326904296875, -0.3722686767578125, -0.35062408447265625, -0.3289794921875, -0.30733489990234375, -0.2856903076171875, -0.26404571533203125, -0.242401123046875, -0.22075653076171875, -0.1991119384765625, -0.17746734619140625, -0.15582275390625, -0.13417816162109375, -0.1125335693359375, -0.09088897705078125, -0.069244384765625, -0.04759979248046875, -0.0259552001953125, -0.00431060791015625, 0.017333984375, 0.03897857666015625, 0.0606231689453125, 0.08226776123046875, 0.103912353515625, 0.12555694580078125, 0.1472015380859375, 0.16884613037109375, 0.19049072265625, 0.21213531494140625, 0.2337799072265625, 0.25542449951171875, 0.277069091796875, 0.29871368408203125, 0.3203582763671875, 0.34200286865234375, 0.3636474609375, 0.38529205322265625, 0.4069366455078125, 0.42858123779296875, 0.450225830078125, 0.47187042236328125, 0.4935150146484375, 0.5151596069335938, 0.53680419921875, 0.5584487915039062, 0.5800933837890625, 0.6017379760742188, 0.623382568359375, 0.6450271606445312, 0.6666717529296875, 0.6883163452148438, 0.7099609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 0.0, 5.0, 16.0, 14.0, 12.0, 10.0, 17.0, 30.0, 25.0, 30.0, 31.0, 38.0, 41.0, 59.0, 44.0, 47.0, 53.0, 37.0, 56.0, 60.0, 55.0, 35.0, 41.0, 42.0, 34.0, 32.0, 26.0, 16.0, 18.0, 20.0, 7.0, 7.0, 5.0, 8.0, 10.0, 6.0, 1.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.309814453125, -0.3017253875732422, -0.2936363220214844, -0.28554725646972656, -0.27745819091796875, -0.26936912536621094, -0.2612800598144531, -0.2531909942626953, -0.2451019287109375, -0.2370128631591797, -0.22892379760742188, -0.22083473205566406, -0.21274566650390625, -0.20465660095214844, -0.19656753540039062, -0.1884784698486328, -0.180389404296875, -0.1723003387451172, -0.16421127319335938, -0.15612220764160156, -0.14803314208984375, -0.13994407653808594, -0.13185501098632812, -0.12376594543457031, -0.1156768798828125, -0.10758781433105469, -0.09949874877929688, -0.09140968322753906, -0.08332061767578125, -0.07523155212402344, -0.06714248657226562, -0.05905342102050781, -0.05096435546875, -0.04287528991699219, -0.034786224365234375, -0.026697158813476562, -0.01860809326171875, -0.010519027709960938, -0.002429962158203125, 0.0056591033935546875, 0.0137481689453125, 0.021837234497070312, 0.029926300048828125, 0.03801536560058594, 0.04610443115234375, 0.05419349670410156, 0.062282562255859375, 0.07037162780761719, 0.078460693359375, 0.08654975891113281, 0.09463882446289062, 0.10272789001464844, 0.11081695556640625, 0.11890602111816406, 0.12699508666992188, 0.1350841522216797, 0.1431732177734375, 0.1512622833251953, 0.15935134887695312, 0.16744041442871094, 0.17552947998046875, 0.18361854553222656, 0.19170761108398438, 0.1997966766357422, 0.2078857421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 4.0, 3.0, 7.0, 11.0, 10.0, 15.0, 15.0, 12.0, 27.0, 20.0, 25.0, 29.0, 43.0, 30.0, 38.0, 40.0, 56.0, 62.0, 53.0, 51.0, 56.0, 56.0, 52.0, 37.0, 34.0, 34.0, 33.0, 31.0, 19.0, 25.0, 12.0, 10.0, 15.0, 10.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.834659576416016, -21.208133697509766, -20.58160972595215, -19.9550838470459, -19.32855796813965, -18.70203399658203, -18.07550811767578, -17.44898223876953, -16.82245635986328, -16.19593048095703, -15.569405555725098, -14.942880630493164, -14.316354751586914, -13.68982982635498, -13.063304901123047, -12.436779022216797, -11.81025505065918, -11.183730125427246, -10.557204246520996, -9.930679321289062, -9.304153442382812, -8.677628517150879, -8.051103591918945, -7.4245781898498535, -6.798052787780762, -6.17152738571167, -5.545001983642578, -4.9184770584106445, -4.291951656341553, -3.665426254272461, -3.0389010906219482, -2.4123759269714355, -1.7858524322509766, -1.1593271493911743, -0.5328018665313721, 0.09372341632843018, 0.7202486991882324, 1.3467741012573242, 1.973299264907837, 2.5998244285583496, 3.2263498306274414, 3.852875232696533, 4.479400634765625, 5.105925559997559, 5.73245096206665, 6.358976364135742, 6.985501289367676, 7.612026691436768, 8.23855209350586, 8.865077018737793, 9.491602897644043, 10.118127822875977, 10.744653701782227, 11.37117862701416, 11.997703552246094, 12.624229431152344, 13.250754356384277, 13.877279281616211, 14.503805160522461, 15.130330085754395, 15.756855010986328, 16.383380889892578, 17.009906768798828, 17.636430740356445, 18.262956619262695]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 7.0, 2.0, 7.0, 5.0, 4.0, 7.0, 6.0, 11.0, 11.0, 13.0, 22.0, 24.0, 18.0, 18.0, 24.0, 26.0, 25.0, 18.0, 26.0, 29.0, 41.0, 38.0, 32.0, 48.0, 47.0, 35.0, 28.0, 30.0, 43.0, 36.0, 37.0, 29.0, 34.0, 26.0, 19.0, 26.0, 29.0, 22.0, 20.0, 16.0, 7.0, 10.0, 6.0, 7.0, 4.0, 4.0, 3.0, 11.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-14.431306838989258, -13.94017219543457, -13.449037551879883, -12.957902908325195, -12.466768264770508, -11.97563362121582, -11.484498977661133, -10.993364334106445, -10.502229690551758, -10.01109504699707, -9.519960403442383, -9.028825759887695, -8.537691116333008, -8.04655647277832, -7.555421352386475, -7.064286708831787, -6.573151588439941, -6.082016944885254, -5.590882301330566, -5.099747657775879, -4.608613014221191, -4.117478370666504, -3.626343250274658, -3.1352086067199707, -2.644073963165283, -2.1529393196105957, -1.6618045568466187, -1.1706697940826416, -0.6795351505279541, -0.1884005069732666, 0.302734375, 0.7938690185546875, 1.285003662109375, 1.7761383056640625, 2.26727294921875, 2.7584078311920166, 3.249542474746704, 3.7406771183013916, 4.231812000274658, 4.722946643829346, 5.214081287384033, 5.705215930938721, 6.196350574493408, 6.687485694885254, 7.178620338439941, 7.669754981994629, 8.160889625549316, 8.652024269104004, 9.143158912658691, 9.634293556213379, 10.125428199768066, 10.616562843322754, 11.107697486877441, 11.598832130432129, 12.089967727661133, 12.58110237121582, 13.072237014770508, 13.563371658325195, 14.054506301879883, 14.54564094543457, 15.036775588989258, 15.527910232543945, 16.019044876098633, 16.51017951965332, 17.001314163208008]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 6.0, 13.0, 19.0, 18.0, 37.0, 71.0, 63.0, 93.0, 171.0, 237.0, 431.0, 674.0, 1075.0, 1613.0, 2364.0, 3789.0, 6129.0, 9363.0, 14690.0, 22374.0, 33977.0, 49812.0, 69530.0, 91986.0, 111359.0, 122277.0, 120661.0, 106459.0, 85080.0, 63590.0, 44436.0, 30201.0, 20041.0, 12868.0, 8275.0, 5309.0, 3338.0, 2179.0, 1459.0, 849.0, 616.0, 360.0, 238.0, 142.0, 91.0, 75.0, 46.0, 29.0, 14.0, 10.0, 8.0, 7.0, 7.0, 1.0, 2.0], "bins": [-17.21875, -16.7247314453125, -16.230712890625, -15.7366943359375, -15.24267578125, -14.7486572265625, -14.254638671875, -13.7606201171875, -13.2666015625, -12.7725830078125, -12.278564453125, -11.7845458984375, -11.29052734375, -10.7965087890625, -10.302490234375, -9.8084716796875, -9.314453125, -8.8204345703125, -8.326416015625, -7.8323974609375, -7.33837890625, -6.8443603515625, -6.350341796875, -5.8563232421875, -5.3623046875, -4.8682861328125, -4.374267578125, -3.8802490234375, -3.38623046875, -2.8922119140625, -2.398193359375, -1.9041748046875, -1.41015625, -0.9161376953125, -0.422119140625, 0.0718994140625, 0.56591796875, 1.0599365234375, 1.553955078125, 2.0479736328125, 2.5419921875, 3.0360107421875, 3.530029296875, 4.0240478515625, 4.51806640625, 5.0120849609375, 5.506103515625, 6.0001220703125, 6.494140625, 6.9881591796875, 7.482177734375, 7.9761962890625, 8.47021484375, 8.9642333984375, 9.458251953125, 9.9522705078125, 10.4462890625, 10.9403076171875, 11.434326171875, 11.9283447265625, 12.42236328125, 12.9163818359375, 13.410400390625, 13.9044189453125, 14.3984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 8.0, 4.0, 8.0, 4.0, 6.0, 10.0, 12.0, 17.0, 18.0, 21.0, 23.0, 17.0, 25.0, 25.0, 25.0, 17.0, 32.0, 30.0, 41.0, 35.0, 38.0, 41.0, 48.0, 34.0, 30.0, 32.0, 41.0, 41.0, 29.0, 36.0, 32.0, 23.0, 19.0, 29.0, 32.0, 16.0, 19.0, 12.0, 10.0, 8.0, 8.0, 6.0, 2.0, 6.0, 5.0, 7.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-13.7421875, -13.2718505859375, -12.801513671875, -12.3311767578125, -11.86083984375, -11.3905029296875, -10.920166015625, -10.4498291015625, -9.9794921875, -9.5091552734375, -9.038818359375, -8.5684814453125, -8.09814453125, -7.6278076171875, -7.157470703125, -6.6871337890625, -6.216796875, -5.7464599609375, -5.276123046875, -4.8057861328125, -4.33544921875, -3.8651123046875, -3.394775390625, -2.9244384765625, -2.4541015625, -1.9837646484375, -1.513427734375, -1.0430908203125, -0.57275390625, -0.1024169921875, 0.367919921875, 0.8382568359375, 1.30859375, 1.7789306640625, 2.249267578125, 2.7196044921875, 3.18994140625, 3.6602783203125, 4.130615234375, 4.6009521484375, 5.0712890625, 5.5416259765625, 6.011962890625, 6.4822998046875, 6.95263671875, 7.4229736328125, 7.893310546875, 8.3636474609375, 8.833984375, 9.3043212890625, 9.774658203125, 10.2449951171875, 10.71533203125, 11.1856689453125, 11.656005859375, 12.1263427734375, 12.5966796875, 13.0670166015625, 13.537353515625, 14.0076904296875, 14.47802734375, 14.9483642578125, 15.418701171875, 15.8890380859375, 16.359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 8.0, 14.0, 16.0, 40.0, 55.0, 80.0, 119.0, 207.0, 268.0, 400.0, 601.0, 877.0, 1316.0, 1989.0, 3011.0, 4547.0, 6925.0, 10629.0, 15301.0, 22910.0, 33888.0, 46890.0, 64017.0, 82106.0, 98812.0, 109956.0, 111759.0, 103556.0, 88029.0, 70304.0, 52646.0, 37868.0, 26106.0, 17883.0, 12008.0, 7859.0, 5157.0, 3524.0, 2344.0, 1552.0, 999.0, 699.0, 465.0, 266.0, 178.0, 119.0, 85.0, 63.0, 33.0, 26.0, 18.0, 14.0, 13.0, 5.0, 5.0, 1.0, 1.0], "bins": [-14.953125, -14.5023193359375, -14.051513671875, -13.6007080078125, -13.14990234375, -12.6990966796875, -12.248291015625, -11.7974853515625, -11.3466796875, -10.8958740234375, -10.445068359375, -9.9942626953125, -9.54345703125, -9.0926513671875, -8.641845703125, -8.1910400390625, -7.740234375, -7.2894287109375, -6.838623046875, -6.3878173828125, -5.93701171875, -5.4862060546875, -5.035400390625, -4.5845947265625, -4.1337890625, -3.6829833984375, -3.232177734375, -2.7813720703125, -2.33056640625, -1.8797607421875, -1.428955078125, -0.9781494140625, -0.52734375, -0.0765380859375, 0.374267578125, 0.8250732421875, 1.27587890625, 1.7266845703125, 2.177490234375, 2.6282958984375, 3.0791015625, 3.5299072265625, 3.980712890625, 4.4315185546875, 4.88232421875, 5.3331298828125, 5.783935546875, 6.2347412109375, 6.685546875, 7.1363525390625, 7.587158203125, 8.0379638671875, 8.48876953125, 8.9395751953125, 9.390380859375, 9.8411865234375, 10.2919921875, 10.7427978515625, 11.193603515625, 11.6444091796875, 12.09521484375, 12.5460205078125, 12.996826171875, 13.4476318359375, 13.8984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 9.0, 4.0, 8.0, 8.0, 7.0, 17.0, 12.0, 20.0, 11.0, 21.0, 17.0, 19.0, 23.0, 25.0, 40.0, 26.0, 36.0, 37.0, 50.0, 40.0, 39.0, 42.0, 29.0, 21.0, 33.0, 34.0, 34.0, 39.0, 34.0, 33.0, 38.0, 28.0, 27.0, 22.0, 16.0, 19.0, 18.0, 14.0, 11.0, 6.0, 8.0, 10.0, 4.0, 0.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.3203125, -9.0089111328125, -8.697509765625, -8.3861083984375, -8.07470703125, -7.7633056640625, -7.451904296875, -7.1405029296875, -6.8291015625, -6.5177001953125, -6.206298828125, -5.8948974609375, -5.58349609375, -5.2720947265625, -4.960693359375, -4.6492919921875, -4.337890625, -4.0264892578125, -3.715087890625, -3.4036865234375, -3.09228515625, -2.7808837890625, -2.469482421875, -2.1580810546875, -1.8466796875, -1.5352783203125, -1.223876953125, -0.9124755859375, -0.60107421875, -0.2896728515625, 0.021728515625, 0.3331298828125, 0.64453125, 0.9559326171875, 1.267333984375, 1.5787353515625, 1.89013671875, 2.2015380859375, 2.512939453125, 2.8243408203125, 3.1357421875, 3.4471435546875, 3.758544921875, 4.0699462890625, 4.38134765625, 4.6927490234375, 5.004150390625, 5.3155517578125, 5.626953125, 5.9383544921875, 6.249755859375, 6.5611572265625, 6.87255859375, 7.1839599609375, 7.495361328125, 7.8067626953125, 8.1181640625, 8.4295654296875, 8.740966796875, 9.0523681640625, 9.36376953125, 9.6751708984375, 9.986572265625, 10.2979736328125, 10.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 7.0, 11.0, 22.0, 22.0, 46.0, 54.0, 76.0, 95.0, 137.0, 224.0, 304.0, 410.0, 666.0, 957.0, 1567.0, 2429.0, 3845.0, 6200.0, 10393.0, 17582.0, 30467.0, 51236.0, 83823.0, 124740.0, 159503.0, 166247.0, 139122.0, 97363.0, 60941.0, 36443.0, 21142.0, 12530.0, 7464.0, 4558.0, 2720.0, 1761.0, 1109.0, 721.0, 496.0, 351.0, 226.0, 155.0, 114.0, 84.0, 64.0, 37.0, 36.0, 21.0, 10.0, 7.0, 13.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.6328125, -6.4266357421875, -6.220458984375, -6.0142822265625, -5.80810546875, -5.6019287109375, -5.395751953125, -5.1895751953125, -4.9833984375, -4.7772216796875, -4.571044921875, -4.3648681640625, -4.15869140625, -3.9525146484375, -3.746337890625, -3.5401611328125, -3.333984375, -3.1278076171875, -2.921630859375, -2.7154541015625, -2.50927734375, -2.3031005859375, -2.096923828125, -1.8907470703125, -1.6845703125, -1.4783935546875, -1.272216796875, -1.0660400390625, -0.85986328125, -0.6536865234375, -0.447509765625, -0.2413330078125, -0.03515625, 0.1710205078125, 0.377197265625, 0.5833740234375, 0.78955078125, 0.9957275390625, 1.201904296875, 1.4080810546875, 1.6142578125, 1.8204345703125, 2.026611328125, 2.2327880859375, 2.43896484375, 2.6451416015625, 2.851318359375, 3.0574951171875, 3.263671875, 3.4698486328125, 3.676025390625, 3.8822021484375, 4.08837890625, 4.2945556640625, 4.500732421875, 4.7069091796875, 4.9130859375, 5.1192626953125, 5.325439453125, 5.5316162109375, 5.73779296875, 5.9439697265625, 6.150146484375, 6.3563232421875, 6.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 13.0, 21.0, 15.0, 28.0, 34.0, 45.0, 44.0, 53.0, 67.0, 89.0, 81.0, 82.0, 74.0, 74.0, 62.0, 48.0, 47.0, 35.0, 21.0, 19.0, 10.0, 11.0, 7.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008153915405273438, -0.0007837414741516113, -0.0007520914077758789, -0.0007204413414001465, -0.0006887912750244141, -0.0006571412086486816, -0.0006254911422729492, -0.0005938410758972168, -0.0005621910095214844, -0.000530540943145752, -0.0004988908767700195, -0.0004672408103942871, -0.0004355907440185547, -0.00040394067764282227, -0.00037229061126708984, -0.0003406405448913574, -0.000308990478515625, -0.0002773404121398926, -0.00024569034576416016, -0.00021404027938842773, -0.0001823902130126953, -0.0001507401466369629, -0.00011909008026123047, -8.744001388549805e-05, -5.5789947509765625e-05, -2.4139881134033203e-05, 7.510185241699219e-06, 3.916025161743164e-05, 7.081031799316406e-05, 0.00010246038436889648, 0.0001341104507446289, 0.00016576051712036133, 0.00019741058349609375, 0.00022906064987182617, 0.0002607107162475586, 0.000292360782623291, 0.00032401084899902344, 0.00035566091537475586, 0.0003873109817504883, 0.0004189610481262207, 0.0004506111145019531, 0.00048226118087768555, 0.000513911247253418, 0.0005455613136291504, 0.0005772113800048828, 0.0006088614463806152, 0.0006405115127563477, 0.0006721615791320801, 0.0007038116455078125, 0.0007354617118835449, 0.0007671117782592773, 0.0007987618446350098, 0.0008304119110107422, 0.0008620619773864746, 0.000893712043762207, 0.0009253621101379395, 0.0009570121765136719, 0.0009886622428894043, 0.0010203123092651367, 0.0010519623756408691, 0.0010836124420166016, 0.001115262508392334, 0.0011469125747680664, 0.0011785626411437988, 0.0012102127075195312]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 11.0, 14.0, 23.0, 33.0, 59.0, 79.0, 118.0, 174.0, 255.0, 389.0, 553.0, 834.0, 1377.0, 2241.0, 3503.0, 5777.0, 9845.0, 16963.0, 29772.0, 52271.0, 87794.0, 134667.0, 170555.0, 174080.0, 136972.0, 91267.0, 54278.0, 30891.0, 17753.0, 10075.0, 5992.0, 3616.0, 2208.0, 1464.0, 926.0, 531.0, 391.0, 280.0, 152.0, 123.0, 82.0, 58.0, 36.0, 20.0, 19.0, 11.0, 9.0, 2.0, 4.0, 6.0, 2.0], "bins": [-8.390625, -8.15777587890625, -7.9249267578125, -7.69207763671875, -7.459228515625, -7.22637939453125, -6.9935302734375, -6.76068115234375, -6.52783203125, -6.29498291015625, -6.0621337890625, -5.82928466796875, -5.596435546875, -5.36358642578125, -5.1307373046875, -4.89788818359375, -4.6650390625, -4.43218994140625, -4.1993408203125, -3.96649169921875, -3.733642578125, -3.50079345703125, -3.2679443359375, -3.03509521484375, -2.80224609375, -2.56939697265625, -2.3365478515625, -2.10369873046875, -1.870849609375, -1.63800048828125, -1.4051513671875, -1.17230224609375, -0.939453125, -0.70660400390625, -0.4737548828125, -0.24090576171875, -0.008056640625, 0.22479248046875, 0.4576416015625, 0.69049072265625, 0.92333984375, 1.15618896484375, 1.3890380859375, 1.62188720703125, 1.854736328125, 2.08758544921875, 2.3204345703125, 2.55328369140625, 2.7861328125, 3.01898193359375, 3.2518310546875, 3.48468017578125, 3.717529296875, 3.95037841796875, 4.1832275390625, 4.41607666015625, 4.64892578125, 4.88177490234375, 5.1146240234375, 5.34747314453125, 5.580322265625, 5.81317138671875, 6.0460205078125, 6.27886962890625, 6.51171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 2.0, 7.0, 11.0, 14.0, 17.0, 22.0, 23.0, 25.0, 27.0, 30.0, 33.0, 29.0, 45.0, 43.0, 44.0, 57.0, 46.0, 56.0, 46.0, 49.0, 49.0, 52.0, 37.0, 22.0, 35.0, 32.0, 23.0, 23.0, 21.0, 17.0, 11.0, 8.0, 10.0, 3.0, 2.0, 7.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.619140625, -2.54010009765625, -2.4610595703125, -2.38201904296875, -2.302978515625, -2.22393798828125, -2.1448974609375, -2.06585693359375, -1.98681640625, -1.90777587890625, -1.8287353515625, -1.74969482421875, -1.670654296875, -1.59161376953125, -1.5125732421875, -1.43353271484375, -1.3544921875, -1.27545166015625, -1.1964111328125, -1.11737060546875, -1.038330078125, -0.95928955078125, -0.8802490234375, -0.80120849609375, -0.72216796875, -0.64312744140625, -0.5640869140625, -0.48504638671875, -0.406005859375, -0.32696533203125, -0.2479248046875, -0.16888427734375, -0.08984375, -0.01080322265625, 0.0682373046875, 0.14727783203125, 0.226318359375, 0.30535888671875, 0.3843994140625, 0.46343994140625, 0.54248046875, 0.62152099609375, 0.7005615234375, 0.77960205078125, 0.858642578125, 0.93768310546875, 1.0167236328125, 1.09576416015625, 1.1748046875, 1.25384521484375, 1.3328857421875, 1.41192626953125, 1.490966796875, 1.57000732421875, 1.6490478515625, 1.72808837890625, 1.80712890625, 1.88616943359375, 1.9652099609375, 2.04425048828125, 2.123291015625, 2.20233154296875, 2.2813720703125, 2.36041259765625, 2.439453125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 6.0, 6.0, 4.0, 6.0, 8.0, 9.0, 15.0, 13.0, 11.0, 25.0, 13.0, 37.0, 23.0, 25.0, 28.0, 35.0, 46.0, 48.0, 52.0, 43.0, 38.0, 52.0, 51.0, 50.0, 47.0, 41.0, 33.0, 31.0, 27.0, 31.0, 30.0, 9.0, 17.0, 26.0, 17.0, 11.0, 1.0, 6.0, 6.0, 5.0, 5.0, 1.0, 9.0, 0.0, 3.0, 4.0, 1.0, 3.0, 1.0], "bins": [-19.92853355407715, -19.375043869018555, -18.821556091308594, -18.26806640625, -17.714576721191406, -17.161087036132812, -16.60759925842285, -16.054109573364258, -15.500619888305664, -14.947131156921387, -14.393641471862793, -13.840152740478516, -13.286663055419922, -12.733174324035645, -12.179685592651367, -11.626195907592773, -11.072707176208496, -10.519218444824219, -9.965728759765625, -9.412240028381348, -8.858750343322754, -8.305261611938477, -7.751772403717041, -7.1982831954956055, -6.64479398727417, -6.091304779052734, -5.537815570831299, -4.984326362609863, -4.430837631225586, -3.8773481845855713, -3.323859214782715, -2.7703700065612793, -2.2168807983398438, -1.6633915901184082, -1.1099025011062622, -0.5564134120941162, -0.002924203872680664, 0.5505650043487549, 1.1040539741516113, 1.6575431823730469, 2.2110323905944824, 2.764521598815918, 3.3180108070373535, 3.87149977684021, 4.424988746643066, 4.97847843170166, 5.5319671630859375, 6.085456371307373, 6.638945579528809, 7.192434787750244, 7.74592399597168, 8.299412727355957, 8.85290241241455, 9.406391143798828, 9.959880828857422, 10.5133695602417, 11.066858291625977, 11.620347023010254, 12.173836708068848, 12.727325439453125, 13.280815124511719, 13.834303855895996, 14.387792587280273, 14.941282272338867, 15.494771957397461]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 10.0, 8.0, 14.0, 11.0, 19.0, 10.0, 19.0, 11.0, 28.0, 26.0, 28.0, 26.0, 37.0, 28.0, 36.0, 32.0, 28.0, 37.0, 39.0, 41.0, 32.0, 50.0, 43.0, 28.0, 23.0, 46.0, 30.0, 28.0, 29.0, 29.0, 16.0, 16.0, 17.0, 14.0, 23.0, 17.0, 10.0, 10.0, 9.0, 4.0, 4.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.991277694702148, -14.489485740661621, -13.987693786621094, -13.485901832580566, -12.984109878540039, -12.482318878173828, -11.9805269241333, -11.478734970092773, -10.976943016052246, -10.475151062011719, -9.973359107971191, -9.471567153930664, -8.969776153564453, -8.46798324584961, -7.966192245483398, -7.464400291442871, -6.962608337402344, -6.460816383361816, -5.959024429321289, -5.45723295211792, -4.955440998077393, -4.453649044036865, -3.951857328414917, -3.4500656127929688, -2.9482736587524414, -2.446481704711914, -1.9446899890899658, -1.442898154258728, -0.9411063194274902, -0.4393143653869629, 0.06247735023498535, 0.5642690658569336, 1.0660591125488281, 1.567850947380066, 2.0696427822113037, 2.571434497833252, 3.0732264518737793, 3.5750184059143066, 4.076809883117676, 4.578601837158203, 5.0803937911987305, 5.582185745239258, 6.083977699279785, 6.585769176483154, 7.087561130523682, 7.589353084564209, 8.091144561767578, 8.592936515808105, 9.094728469848633, 9.59652042388916, 10.098312377929688, 10.600104331970215, 11.101896286010742, 11.603687286376953, 12.10547924041748, 12.607271194458008, 13.109063148498535, 13.610855102539062, 14.11264705657959, 14.614439010620117, 15.116230010986328, 15.618022918701172, 16.119813919067383, 16.621604919433594, 17.123397827148438]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 10.0, 10.0, 17.0, 32.0, 47.0, 64.0, 102.0, 182.0, 195.0, 390.0, 586.0, 865.0, 1405.0, 2198.0, 3631.0, 5606.0, 9228.0, 15276.0, 25292.0, 43179.0, 73530.0, 127043.0, 216126.0, 352708.0, 519330.0, 649089.0, 659019.0, 542114.0, 377116.0, 234385.0, 138404.0, 80785.0, 46706.0, 27413.0, 16171.0, 9939.0, 6081.0, 3702.0, 2306.0, 1471.0, 928.0, 551.0, 371.0, 243.0, 175.0, 90.0, 63.0, 35.0, 29.0, 25.0, 4.0, 13.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.828125, -16.3193359375, -15.810546875, -15.3017578125, -14.79296875, -14.2841796875, -13.775390625, -13.2666015625, -12.7578125, -12.2490234375, -11.740234375, -11.2314453125, -10.72265625, -10.2138671875, -9.705078125, -9.1962890625, -8.6875, -8.1787109375, -7.669921875, -7.1611328125, -6.65234375, -6.1435546875, -5.634765625, -5.1259765625, -4.6171875, -4.1083984375, -3.599609375, -3.0908203125, -2.58203125, -2.0732421875, -1.564453125, -1.0556640625, -0.546875, -0.0380859375, 0.470703125, 0.9794921875, 1.48828125, 1.9970703125, 2.505859375, 3.0146484375, 3.5234375, 4.0322265625, 4.541015625, 5.0498046875, 5.55859375, 6.0673828125, 6.576171875, 7.0849609375, 7.59375, 8.1025390625, 8.611328125, 9.1201171875, 9.62890625, 10.1376953125, 10.646484375, 11.1552734375, 11.6640625, 12.1728515625, 12.681640625, 13.1904296875, 13.69921875, 14.2080078125, 14.716796875, 15.2255859375, 15.734375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 7.0, 6.0, 7.0, 16.0, 14.0, 15.0, 10.0, 19.0, 19.0, 24.0, 26.0, 20.0, 30.0, 33.0, 32.0, 38.0, 24.0, 34.0, 43.0, 35.0, 40.0, 41.0, 36.0, 42.0, 38.0, 27.0, 40.0, 33.0, 21.0, 32.0, 28.0, 23.0, 19.0, 13.0, 15.0, 18.0, 11.0, 16.0, 12.0, 8.0, 6.0, 2.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.796875, -12.3558349609375, -11.914794921875, -11.4737548828125, -11.03271484375, -10.5916748046875, -10.150634765625, -9.7095947265625, -9.2685546875, -8.8275146484375, -8.386474609375, -7.9454345703125, -7.50439453125, -7.0633544921875, -6.622314453125, -6.1812744140625, -5.740234375, -5.2991943359375, -4.858154296875, -4.4171142578125, -3.97607421875, -3.5350341796875, -3.093994140625, -2.6529541015625, -2.2119140625, -1.7708740234375, -1.329833984375, -0.8887939453125, -0.44775390625, -0.0067138671875, 0.434326171875, 0.8753662109375, 1.31640625, 1.7574462890625, 2.198486328125, 2.6395263671875, 3.08056640625, 3.5216064453125, 3.962646484375, 4.4036865234375, 4.8447265625, 5.2857666015625, 5.726806640625, 6.1678466796875, 6.60888671875, 7.0499267578125, 7.490966796875, 7.9320068359375, 8.373046875, 8.8140869140625, 9.255126953125, 9.6961669921875, 10.13720703125, 10.5782470703125, 11.019287109375, 11.4603271484375, 11.9013671875, 12.3424072265625, 12.783447265625, 13.2244873046875, 13.66552734375, 14.1065673828125, 14.547607421875, 14.9886474609375, 15.4296875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 5.0, 8.0, 9.0, 10.0, 19.0, 27.0, 50.0, 59.0, 135.0, 181.0, 281.0, 416.0, 675.0, 1021.0, 1577.0, 2374.0, 3709.0, 5747.0, 9020.0, 14345.0, 23171.0, 36682.0, 58229.0, 92301.0, 144130.0, 218827.0, 317519.0, 427718.0, 519981.0, 552900.0, 504110.0, 405549.0, 294484.0, 200967.0, 131265.0, 83926.0, 53030.0, 33369.0, 20637.0, 12965.0, 8235.0, 5113.0, 3394.0, 2137.0, 1379.0, 906.0, 600.0, 388.0, 236.0, 139.0, 113.0, 72.0, 56.0, 39.0, 23.0, 10.0, 13.0, 4.0, 6.0, 4.0, 2.0], "bins": [-15.453125, -14.97607421875, -14.4990234375, -14.02197265625, -13.544921875, -13.06787109375, -12.5908203125, -12.11376953125, -11.63671875, -11.15966796875, -10.6826171875, -10.20556640625, -9.728515625, -9.25146484375, -8.7744140625, -8.29736328125, -7.8203125, -7.34326171875, -6.8662109375, -6.38916015625, -5.912109375, -5.43505859375, -4.9580078125, -4.48095703125, -4.00390625, -3.52685546875, -3.0498046875, -2.57275390625, -2.095703125, -1.61865234375, -1.1416015625, -0.66455078125, -0.1875, 0.28955078125, 0.7666015625, 1.24365234375, 1.720703125, 2.19775390625, 2.6748046875, 3.15185546875, 3.62890625, 4.10595703125, 4.5830078125, 5.06005859375, 5.537109375, 6.01416015625, 6.4912109375, 6.96826171875, 7.4453125, 7.92236328125, 8.3994140625, 8.87646484375, 9.353515625, 9.83056640625, 10.3076171875, 10.78466796875, 11.26171875, 11.73876953125, 12.2158203125, 12.69287109375, 13.169921875, 13.64697265625, 14.1240234375, 14.60107421875, 15.078125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 6.0, 3.0, 2.0, 6.0, 6.0, 10.0, 8.0, 23.0, 13.0, 19.0, 24.0, 44.0, 41.0, 61.0, 46.0, 74.0, 95.0, 98.0, 80.0, 122.0, 138.0, 154.0, 150.0, 191.0, 202.0, 199.0, 217.0, 211.0, 219.0, 181.0, 168.0, 152.0, 153.0, 125.0, 129.0, 117.0, 89.0, 88.0, 77.0, 68.0, 51.0, 37.0, 32.0, 22.0, 23.0, 30.0, 22.0, 15.0, 13.0, 13.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-6.265625, -6.06707763671875, -5.8685302734375, -5.66998291015625, -5.471435546875, -5.27288818359375, -5.0743408203125, -4.87579345703125, -4.67724609375, -4.47869873046875, -4.2801513671875, -4.08160400390625, -3.883056640625, -3.68450927734375, -3.4859619140625, -3.28741455078125, -3.0888671875, -2.89031982421875, -2.6917724609375, -2.49322509765625, -2.294677734375, -2.09613037109375, -1.8975830078125, -1.69903564453125, -1.50048828125, -1.30194091796875, -1.1033935546875, -0.90484619140625, -0.706298828125, -0.50775146484375, -0.3092041015625, -0.11065673828125, 0.087890625, 0.28643798828125, 0.4849853515625, 0.68353271484375, 0.882080078125, 1.08062744140625, 1.2791748046875, 1.47772216796875, 1.67626953125, 1.87481689453125, 2.0733642578125, 2.27191162109375, 2.470458984375, 2.66900634765625, 2.8675537109375, 3.06610107421875, 3.2646484375, 3.46319580078125, 3.6617431640625, 3.86029052734375, 4.058837890625, 4.25738525390625, 4.4559326171875, 4.65447998046875, 4.85302734375, 5.05157470703125, 5.2501220703125, 5.44866943359375, 5.647216796875, 5.84576416015625, 6.0443115234375, 6.24285888671875, 6.44140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 1.0, 7.0, 7.0, 4.0, 9.0, 14.0, 16.0, 18.0, 15.0, 11.0, 27.0, 25.0, 34.0, 37.0, 52.0, 45.0, 48.0, 49.0, 60.0, 57.0, 46.0, 68.0, 53.0, 45.0, 37.0, 35.0, 37.0, 21.0, 27.0, 22.0, 13.0, 17.0, 9.0, 10.0, 3.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.549909591674805, -21.91442108154297, -21.278934478759766, -20.64344596862793, -20.007957458496094, -19.37247085571289, -18.736982345581055, -18.10149383544922, -17.466007232666016, -16.83051872253418, -16.195032119750977, -15.55954360961914, -14.924055099487305, -14.288567543029785, -13.653079986572266, -13.01759147644043, -12.382102966308594, -11.746615409851074, -11.111126899719238, -10.475639343261719, -9.840150833129883, -9.204663276672363, -8.569175720214844, -7.933687686920166, -7.298199653625488, -6.6627116203308105, -6.027223587036133, -5.391736030578613, -4.7562479972839355, -4.120759963989258, -3.485272169113159, -2.8497843742370605, -2.21429443359375, -1.5788065195083618, -0.9433186054229736, -0.30783069133758545, 0.32765722274780273, 0.9631452560424805, 1.598633050918579, 2.2341208457946777, 2.8696088790893555, 3.505096912384033, 4.140584945678711, 4.7760725021362305, 5.411560535430908, 6.047048568725586, 6.6825361251831055, 7.318024158477783, 7.953512191772461, 8.58899974822998, 9.224488258361816, 9.859975814819336, 10.495464324951172, 11.130951881408691, 11.766439437866211, 12.401927947998047, 13.037415504455566, 13.672903060913086, 14.308391571044922, 14.943879127502441, 15.579366683959961, 16.214855194091797, 16.850343704223633, 17.485830307006836, 18.121318817138672]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 6.0, 8.0, 5.0, 6.0, 7.0, 11.0, 12.0, 14.0, 9.0, 15.0, 23.0, 26.0, 29.0, 25.0, 30.0, 36.0, 33.0, 40.0, 33.0, 32.0, 35.0, 42.0, 46.0, 42.0, 37.0, 29.0, 35.0, 28.0, 32.0, 35.0, 27.0, 22.0, 33.0, 28.0, 24.0, 11.0, 19.0, 15.0, 11.0, 12.0, 7.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-16.6811466217041, -16.18553924560547, -15.689933776855469, -15.194326400756836, -14.69871997833252, -14.203113555908203, -13.707507133483887, -13.21190071105957, -12.716293334960938, -12.220686912536621, -11.725080490112305, -11.229473114013672, -10.733866691589355, -10.238260269165039, -9.742653846740723, -9.247047424316406, -8.75144100189209, -8.255834579467773, -7.760227680206299, -7.264621257781982, -6.769014358520508, -6.273407936096191, -5.777801513671875, -5.282195091247559, -4.786588191986084, -4.290981769561768, -3.795374870300293, -3.2997684478759766, -2.804161787033081, -2.3085551261901855, -1.8129487037658691, -1.3173420429229736, -0.8217363357543945, -0.3261297345161438, 0.16947686672210693, 0.6650834083557129, 1.1606900691986084, 1.656296730041504, 2.1519031524658203, 2.647509813308716, 3.1431164741516113, 3.638723134994507, 4.134329795837402, 4.629936218261719, 5.125542640686035, 5.62114953994751, 6.116755962371826, 6.612362861633301, 7.107969284057617, 7.603575706481934, 8.09918212890625, 8.594789505004883, 9.0903959274292, 9.586002349853516, 10.081608772277832, 10.577215194702148, 11.072822570800781, 11.568428993225098, 12.064035415649414, 12.559642791748047, 13.055249214172363, 13.55085563659668, 14.046462059020996, 14.542068481445312, 15.037674903869629]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 8.0, 15.0, 21.0, 27.0, 57.0, 73.0, 108.0, 174.0, 273.0, 435.0, 685.0, 1134.0, 1871.0, 2984.0, 5087.0, 8387.0, 13579.0, 21903.0, 35126.0, 53589.0, 78417.0, 105274.0, 128774.0, 137491.0, 127945.0, 104704.0, 77275.0, 52625.0, 34315.0, 21924.0, 13222.0, 8233.0, 5020.0, 2982.0, 1833.0, 1132.0, 673.0, 434.0, 247.0, 139.0, 124.0, 63.0, 48.0, 29.0, 29.0, 14.0, 16.0, 8.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-6.75390625, -6.53936767578125, -6.3248291015625, -6.11029052734375, -5.895751953125, -5.68121337890625, -5.4666748046875, -5.25213623046875, -5.03759765625, -4.82305908203125, -4.6085205078125, -4.39398193359375, -4.179443359375, -3.96490478515625, -3.7503662109375, -3.53582763671875, -3.3212890625, -3.10675048828125, -2.8922119140625, -2.67767333984375, -2.463134765625, -2.24859619140625, -2.0340576171875, -1.81951904296875, -1.60498046875, -1.39044189453125, -1.1759033203125, -0.96136474609375, -0.746826171875, -0.53228759765625, -0.3177490234375, -0.10321044921875, 0.111328125, 0.32586669921875, 0.5404052734375, 0.75494384765625, 0.969482421875, 1.18402099609375, 1.3985595703125, 1.61309814453125, 1.82763671875, 2.04217529296875, 2.2567138671875, 2.47125244140625, 2.685791015625, 2.90032958984375, 3.1148681640625, 3.32940673828125, 3.5439453125, 3.75848388671875, 3.9730224609375, 4.18756103515625, 4.402099609375, 4.61663818359375, 4.8311767578125, 5.04571533203125, 5.26025390625, 5.47479248046875, 5.6893310546875, 5.90386962890625, 6.118408203125, 6.33294677734375, 6.5474853515625, 6.76202392578125, 6.9765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 7.0, 8.0, 5.0, 5.0, 8.0, 11.0, 12.0, 15.0, 8.0, 16.0, 23.0, 27.0, 25.0, 28.0, 33.0, 34.0, 33.0, 33.0, 34.0, 37.0, 34.0, 41.0, 44.0, 42.0, 35.0, 30.0, 37.0, 28.0, 30.0, 36.0, 25.0, 25.0, 29.0, 32.0, 18.0, 14.0, 22.0, 16.0, 12.0, 9.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-16.640625, -16.1446533203125, -15.648681640625, -15.1527099609375, -14.65673828125, -14.1607666015625, -13.664794921875, -13.1688232421875, -12.6728515625, -12.1768798828125, -11.680908203125, -11.1849365234375, -10.68896484375, -10.1929931640625, -9.697021484375, -9.2010498046875, -8.705078125, -8.2091064453125, -7.713134765625, -7.2171630859375, -6.72119140625, -6.2252197265625, -5.729248046875, -5.2332763671875, -4.7373046875, -4.2413330078125, -3.745361328125, -3.2493896484375, -2.75341796875, -2.2574462890625, -1.761474609375, -1.2655029296875, -0.76953125, -0.2735595703125, 0.222412109375, 0.7183837890625, 1.21435546875, 1.7103271484375, 2.206298828125, 2.7022705078125, 3.1982421875, 3.6942138671875, 4.190185546875, 4.6861572265625, 5.18212890625, 5.6781005859375, 6.174072265625, 6.6700439453125, 7.166015625, 7.6619873046875, 8.157958984375, 8.6539306640625, 9.14990234375, 9.6458740234375, 10.141845703125, 10.6378173828125, 11.1337890625, 11.6297607421875, 12.125732421875, 12.6217041015625, 13.11767578125, 13.6136474609375, 14.109619140625, 14.6055908203125, 15.1015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 9.0, 14.0, 13.0, 12.0, 24.0, 44.0, 45.0, 75.0, 122.0, 208.0, 319.0, 520.0, 885.0, 1575.0, 2887.0, 5336.0, 9895.0, 18874.0, 38503.0, 793631.0, 118256.0, 27021.0, 13791.0, 7293.0, 4008.0, 2217.0, 1174.0, 690.0, 407.0, 242.0, 160.0, 94.0, 64.0, 34.0, 41.0, 20.0, 17.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.8359375, -18.203125, -17.5703125, -16.9375, -16.3046875, -15.671875, -15.0390625, -14.40625, -13.7734375, -13.140625, -12.5078125, -11.875, -11.2421875, -10.609375, -9.9765625, -9.34375, -8.7109375, -8.078125, -7.4453125, -6.8125, -6.1796875, -5.546875, -4.9140625, -4.28125, -3.6484375, -3.015625, -2.3828125, -1.75, -1.1171875, -0.484375, 0.1484375, 0.78125, 1.4140625, 2.046875, 2.6796875, 3.3125, 3.9453125, 4.578125, 5.2109375, 5.84375, 6.4765625, 7.109375, 7.7421875, 8.375, 9.0078125, 9.640625, 10.2734375, 10.90625, 11.5390625, 12.171875, 12.8046875, 13.4375, 14.0703125, 14.703125, 15.3359375, 15.96875, 16.6015625, 17.234375, 17.8671875, 18.5, 19.1328125, 19.765625, 20.3984375, 21.03125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 2.0, 5.0, 7.0, 11.0, 18.0, 21.0, 18.0, 19.0, 21.0, 39.0, 33.0, 27.0, 37.0, 39.0, 42.0, 48.0, 52.0, 44.0, 36.0, 41.0, 43.0, 49.0, 49.0, 37.0, 30.0, 31.0, 34.0, 23.0, 20.0, 28.0, 19.0, 16.0, 8.0, 10.0, 7.0, 6.0, 5.0, 7.0, 6.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.5811767578125, -11.170166015625, -10.7591552734375, -10.34814453125, -9.9371337890625, -9.526123046875, -9.1151123046875, -8.7041015625, -8.2930908203125, -7.882080078125, -7.4710693359375, -7.06005859375, -6.6490478515625, -6.238037109375, -5.8270263671875, -5.416015625, -5.0050048828125, -4.593994140625, -4.1829833984375, -3.77197265625, -3.3609619140625, -2.949951171875, -2.5389404296875, -2.1279296875, -1.7169189453125, -1.305908203125, -0.8948974609375, -0.48388671875, -0.0728759765625, 0.338134765625, 0.7491455078125, 1.16015625, 1.5711669921875, 1.982177734375, 2.3931884765625, 2.80419921875, 3.2152099609375, 3.626220703125, 4.0372314453125, 4.4482421875, 4.8592529296875, 5.270263671875, 5.6812744140625, 6.09228515625, 6.5032958984375, 6.914306640625, 7.3253173828125, 7.736328125, 8.1473388671875, 8.558349609375, 8.9693603515625, 9.38037109375, 9.7913818359375, 10.202392578125, 10.6134033203125, 11.0244140625, 11.4354248046875, 11.846435546875, 12.2574462890625, 12.66845703125, 13.0794677734375, 13.490478515625, 13.9014892578125, 14.3125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 11.0, 14.0, 14.0, 22.0, 46.0, 41.0, 60.0, 94.0, 139.0, 191.0, 351.0, 541.0, 969.0, 1992.0, 4254.0, 10378.0, 29779.0, 781047.0, 180566.0, 22304.0, 8289.0, 3525.0, 1645.0, 906.0, 500.0, 273.0, 174.0, 134.0, 75.0, 58.0, 31.0, 22.0, 15.0, 18.0, 14.0, 16.0, 4.0, 6.0, 10.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.404296875, -2.3311767578125, -2.258056640625, -2.1849365234375, -2.11181640625, -2.0386962890625, -1.965576171875, -1.8924560546875, -1.8193359375, -1.7462158203125, -1.673095703125, -1.5999755859375, -1.52685546875, -1.4537353515625, -1.380615234375, -1.3074951171875, -1.234375, -1.1612548828125, -1.088134765625, -1.0150146484375, -0.94189453125, -0.8687744140625, -0.795654296875, -0.7225341796875, -0.6494140625, -0.5762939453125, -0.503173828125, -0.4300537109375, -0.35693359375, -0.2838134765625, -0.210693359375, -0.1375732421875, -0.064453125, 0.0086669921875, 0.081787109375, 0.1549072265625, 0.22802734375, 0.3011474609375, 0.374267578125, 0.4473876953125, 0.5205078125, 0.5936279296875, 0.666748046875, 0.7398681640625, 0.81298828125, 0.8861083984375, 0.959228515625, 1.0323486328125, 1.10546875, 1.1785888671875, 1.251708984375, 1.3248291015625, 1.39794921875, 1.4710693359375, 1.544189453125, 1.6173095703125, 1.6904296875, 1.7635498046875, 1.836669921875, 1.9097900390625, 1.98291015625, 2.0560302734375, 2.129150390625, 2.2022705078125, 2.275390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 8.0, 15.0, 15.0, 13.0, 15.0, 13.0, 20.0, 28.0, 36.0, 28.0, 44.0, 69.0, 52.0, 60.0, 59.0, 66.0, 59.0, 51.0, 50.0, 32.0, 47.0, 44.0, 26.0, 25.0, 18.0, 9.0, 12.0, 12.0, 13.0, 9.0, 7.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.00018978118896484375, -0.000184500589966774, -0.00017921999096870422, -0.00017393939197063446, -0.0001686587929725647, -0.00016337819397449493, -0.00015809759497642517, -0.0001528169959783554, -0.00014753639698028564, -0.00014225579798221588, -0.00013697519898414612, -0.00013169459998607635, -0.0001264140009880066, -0.00012113340198993683, -0.00011585280299186707, -0.0001105722039937973, -0.00010529160499572754, -0.00010001100599765778, -9.473040699958801e-05, -8.944980800151825e-05, -8.416920900344849e-05, -7.888861000537872e-05, -7.360801100730896e-05, -6.83274120092392e-05, -6.304681301116943e-05, -5.776621401309967e-05, -5.248561501502991e-05, -4.7205016016960144e-05, -4.192441701889038e-05, -3.664381802082062e-05, -3.1363219022750854e-05, -2.608262002468109e-05, -2.0802021026611328e-05, -1.5521422028541565e-05, -1.0240823030471802e-05, -4.9602240324020386e-06, 3.203749656677246e-07, 5.600973963737488e-06, 1.0881572961807251e-05, 1.6162171959877014e-05, 2.1442770957946777e-05, 2.672336995601654e-05, 3.2003968954086304e-05, 3.728456795215607e-05, 4.256516695022583e-05, 4.784576594829559e-05, 5.3126364946365356e-05, 5.840696394443512e-05, 6.368756294250488e-05, 6.896816194057465e-05, 7.424876093864441e-05, 7.952935993671417e-05, 8.480995893478394e-05, 9.00905579328537e-05, 9.537115693092346e-05, 0.00010065175592899323, 0.00010593235492706299, 0.00011121295392513275, 0.00011649355292320251, 0.00012177415192127228, 0.00012705475091934204, 0.0001323353499174118, 0.00013761594891548157, 0.00014289654791355133, 0.0001481771469116211]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 10.0, 15.0, 23.0, 24.0, 31.0, 47.0, 77.0, 91.0, 120.0, 160.0, 259.0, 322.0, 446.0, 631.0, 902.0, 1235.0, 1797.0, 2650.0, 4159.0, 6686.0, 12521.0, 26132.0, 61765.0, 146102.0, 258523.0, 257651.0, 145916.0, 61961.0, 26078.0, 12415.0, 6864.0, 4008.0, 2700.0, 1759.0, 1275.0, 903.0, 597.0, 453.0, 321.0, 266.0, 202.0, 113.0, 95.0, 70.0, 37.0, 45.0, 31.0, 26.0, 14.0, 10.0, 3.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.435546875, -1.39068603515625, -1.3458251953125, -1.30096435546875, -1.256103515625, -1.21124267578125, -1.1663818359375, -1.12152099609375, -1.07666015625, -1.03179931640625, -0.9869384765625, -0.94207763671875, -0.897216796875, -0.85235595703125, -0.8074951171875, -0.76263427734375, -0.7177734375, -0.67291259765625, -0.6280517578125, -0.58319091796875, -0.538330078125, -0.49346923828125, -0.4486083984375, -0.40374755859375, -0.35888671875, -0.31402587890625, -0.2691650390625, -0.22430419921875, -0.179443359375, -0.13458251953125, -0.0897216796875, -0.04486083984375, 0.0, 0.04486083984375, 0.0897216796875, 0.13458251953125, 0.179443359375, 0.22430419921875, 0.2691650390625, 0.31402587890625, 0.35888671875, 0.40374755859375, 0.4486083984375, 0.49346923828125, 0.538330078125, 0.58319091796875, 0.6280517578125, 0.67291259765625, 0.7177734375, 0.76263427734375, 0.8074951171875, 0.85235595703125, 0.897216796875, 0.94207763671875, 0.9869384765625, 1.03179931640625, 1.07666015625, 1.12152099609375, 1.1663818359375, 1.21124267578125, 1.256103515625, 1.30096435546875, 1.3458251953125, 1.39068603515625, 1.435546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 10.0, 13.0, 12.0, 25.0, 19.0, 27.0, 37.0, 43.0, 53.0, 57.0, 73.0, 85.0, 69.0, 66.0, 66.0, 67.0, 46.0, 50.0, 34.0, 18.0, 19.0, 13.0, 16.0, 13.0, 9.0, 9.0, 7.0, 3.0, 3.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.46630859375, -0.4535064697265625, -0.440704345703125, -0.4279022216796875, -0.41510009765625, -0.4022979736328125, -0.389495849609375, -0.3766937255859375, -0.3638916015625, -0.3510894775390625, -0.338287353515625, -0.3254852294921875, -0.31268310546875, -0.2998809814453125, -0.287078857421875, -0.2742767333984375, -0.261474609375, -0.2486724853515625, -0.235870361328125, -0.2230682373046875, -0.21026611328125, -0.1974639892578125, -0.184661865234375, -0.1718597412109375, -0.1590576171875, -0.1462554931640625, -0.133453369140625, -0.1206512451171875, -0.10784912109375, -0.0950469970703125, -0.082244873046875, -0.0694427490234375, -0.056640625, -0.0438385009765625, -0.031036376953125, -0.0182342529296875, -0.00543212890625, 0.0073699951171875, 0.020172119140625, 0.0329742431640625, 0.0457763671875, 0.0585784912109375, 0.071380615234375, 0.0841827392578125, 0.09698486328125, 0.1097869873046875, 0.122589111328125, 0.1353912353515625, 0.148193359375, 0.1609954833984375, 0.173797607421875, 0.1865997314453125, 0.19940185546875, 0.2122039794921875, 0.225006103515625, 0.2378082275390625, 0.2506103515625, 0.2634124755859375, 0.276214599609375, 0.2890167236328125, 0.30181884765625, 0.3146209716796875, 0.327423095703125, 0.3402252197265625, 0.35302734375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 14.0, 7.0, 10.0, 8.0, 7.0, 23.0, 16.0, 20.0, 30.0, 38.0, 30.0, 40.0, 39.0, 40.0, 53.0, 61.0, 53.0, 50.0, 61.0, 44.0, 59.0, 39.0, 37.0, 31.0, 41.0, 28.0, 17.0, 19.0, 18.0, 14.0, 11.0, 5.0, 9.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-22.50246810913086, -21.878021240234375, -21.25357437133789, -20.62912940979004, -20.004682540893555, -19.38023567199707, -18.755788803100586, -18.131343841552734, -17.50689697265625, -16.882450103759766, -16.25800323486328, -15.633557319641113, -15.009111404418945, -14.384664535522461, -13.760217666625977, -13.135771751403809, -12.511324882507324, -11.88687801361084, -11.262432098388672, -10.637985229492188, -10.01353931427002, -9.389092445373535, -8.764646530151367, -8.140199661254883, -7.515753269195557, -6.8913068771362305, -6.266860485076904, -5.642414093017578, -5.017967224121094, -4.393521308898926, -3.7690744400024414, -3.1446280479431152, -2.520181655883789, -1.895735263824463, -1.2712887525558472, -0.6468422412872314, -0.022395849227905273, 0.6020505428314209, 1.2264971733093262, 1.8509435653686523, 2.4753899574279785, 3.0998363494873047, 3.724282741546631, 4.348729133605957, 4.973176002502441, 5.597621917724609, 6.222068786621094, 6.84651517868042, 7.470961570739746, 8.09540843963623, 8.719854354858398, 9.344301223754883, 9.96874713897705, 10.593194007873535, 11.217639923095703, 11.842086791992188, 12.466533660888672, 13.090980529785156, 13.715426445007324, 14.339873313903809, 14.964319229125977, 15.588766098022461, 16.213212966918945, 16.837657928466797, 17.46210479736328]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 4.0, 7.0, 11.0, 11.0, 11.0, 12.0, 13.0, 20.0, 21.0, 28.0, 21.0, 25.0, 36.0, 30.0, 32.0, 36.0, 35.0, 34.0, 35.0, 47.0, 36.0, 44.0, 35.0, 35.0, 32.0, 29.0, 27.0, 33.0, 28.0, 22.0, 27.0, 33.0, 24.0, 12.0, 20.0, 15.0, 13.0, 12.0, 8.0, 3.0, 5.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-16.397401809692383, -15.907699584960938, -15.417997360229492, -14.928296089172363, -14.438593864440918, -13.948891639709473, -13.459190368652344, -12.969488143920898, -12.479785919189453, -11.990083694458008, -11.500381469726562, -11.010680198669434, -10.520977973937988, -10.031275749206543, -9.541574478149414, -9.051872253417969, -8.562170028686523, -8.072467803955078, -7.582766056060791, -7.093064308166504, -6.603362083435059, -6.113659858703613, -5.623958110809326, -5.134256362915039, -4.644554138183594, -4.154851913452148, -3.6651501655578613, -3.175448179244995, -2.685746192932129, -2.1960442066192627, -1.7063422203063965, -1.2166402339935303, -0.7269392013549805, -0.23723721504211426, 0.25246477127075195, 0.7421667575836182, 1.2318687438964844, 1.7215707302093506, 2.211272716522217, 2.700974702835083, 3.190676689147949, 3.6803786754608154, 4.170080661773682, 4.659782409667969, 5.149484634399414, 5.639186859130859, 6.1288886070251465, 6.618590354919434, 7.108292579650879, 7.597994804382324, 8.087696075439453, 8.577398300170898, 9.067100524902344, 9.556802749633789, 10.046504974365234, 10.536206245422363, 11.025908470153809, 11.515610694885254, 12.005311965942383, 12.495014190673828, 12.984716415405273, 13.474418640136719, 13.964120864868164, 14.453822135925293, 14.943524360656738]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 16.0, 33.0, 34.0, 58.0, 90.0, 134.0, 248.0, 357.0, 601.0, 961.0, 1633.0, 2382.0, 3941.0, 6262.0, 9619.0, 15173.0, 23643.0, 35746.0, 51521.0, 70706.0, 91636.0, 109447.0, 119570.0, 117140.0, 104669.0, 85282.0, 63499.0, 46308.0, 30977.0, 20858.0, 13259.0, 8456.0, 5296.0, 3271.0, 2115.0, 1321.0, 842.0, 539.0, 322.0, 208.0, 142.0, 91.0, 47.0, 41.0, 15.0, 7.0, 12.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0], "bins": [-15.671875, -15.208740234375, -14.74560546875, -14.282470703125, -13.8193359375, -13.356201171875, -12.89306640625, -12.429931640625, -11.966796875, -11.503662109375, -11.04052734375, -10.577392578125, -10.1142578125, -9.651123046875, -9.18798828125, -8.724853515625, -8.26171875, -7.798583984375, -7.33544921875, -6.872314453125, -6.4091796875, -5.946044921875, -5.48291015625, -5.019775390625, -4.556640625, -4.093505859375, -3.63037109375, -3.167236328125, -2.7041015625, -2.240966796875, -1.77783203125, -1.314697265625, -0.8515625, -0.388427734375, 0.07470703125, 0.537841796875, 1.0009765625, 1.464111328125, 1.92724609375, 2.390380859375, 2.853515625, 3.316650390625, 3.77978515625, 4.242919921875, 4.7060546875, 5.169189453125, 5.63232421875, 6.095458984375, 6.55859375, 7.021728515625, 7.48486328125, 7.947998046875, 8.4111328125, 8.874267578125, 9.33740234375, 9.800537109375, 10.263671875, 10.726806640625, 11.18994140625, 11.653076171875, 12.1162109375, 12.579345703125, 13.04248046875, 13.505615234375, 13.96875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 3.0, 7.0, 8.0, 12.0, 11.0, 13.0, 10.0, 17.0, 20.0, 30.0, 25.0, 26.0, 32.0, 33.0, 28.0, 44.0, 29.0, 31.0, 35.0, 42.0, 52.0, 37.0, 40.0, 33.0, 33.0, 29.0, 25.0, 33.0, 29.0, 24.0, 27.0, 31.0, 23.0, 17.0, 20.0, 15.0, 13.0, 11.0, 6.0, 6.0, 3.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-15.921875, -15.4483642578125, -14.974853515625, -14.5013427734375, -14.02783203125, -13.5543212890625, -13.080810546875, -12.6072998046875, -12.1337890625, -11.6602783203125, -11.186767578125, -10.7132568359375, -10.23974609375, -9.7662353515625, -9.292724609375, -8.8192138671875, -8.345703125, -7.8721923828125, -7.398681640625, -6.9251708984375, -6.45166015625, -5.9781494140625, -5.504638671875, -5.0311279296875, -4.5576171875, -4.0841064453125, -3.610595703125, -3.1370849609375, -2.66357421875, -2.1900634765625, -1.716552734375, -1.2430419921875, -0.76953125, -0.2960205078125, 0.177490234375, 0.6510009765625, 1.12451171875, 1.5980224609375, 2.071533203125, 2.5450439453125, 3.0185546875, 3.4920654296875, 3.965576171875, 4.4390869140625, 4.91259765625, 5.3861083984375, 5.859619140625, 6.3331298828125, 6.806640625, 7.2801513671875, 7.753662109375, 8.2271728515625, 8.70068359375, 9.1741943359375, 9.647705078125, 10.1212158203125, 10.5947265625, 11.0682373046875, 11.541748046875, 12.0152587890625, 12.48876953125, 12.9622802734375, 13.435791015625, 13.9093017578125, 14.3828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 9.0, 2.0, 10.0, 29.0, 41.0, 62.0, 102.0, 149.0, 253.0, 389.0, 622.0, 1052.0, 1660.0, 2878.0, 4560.0, 7514.0, 12332.0, 20129.0, 31619.0, 49214.0, 71503.0, 97323.0, 120811.0, 132918.0, 129766.0, 111049.0, 85150.0, 60507.0, 39964.0, 25693.0, 16029.0, 9833.0, 5935.0, 3684.0, 2247.0, 1352.0, 854.0, 504.0, 288.0, 185.0, 119.0, 85.0, 60.0, 33.0, 13.0, 8.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.796875, -16.2994384765625, -15.802001953125, -15.3045654296875, -14.80712890625, -14.3096923828125, -13.812255859375, -13.3148193359375, -12.8173828125, -12.3199462890625, -11.822509765625, -11.3250732421875, -10.82763671875, -10.3302001953125, -9.832763671875, -9.3353271484375, -8.837890625, -8.3404541015625, -7.843017578125, -7.3455810546875, -6.84814453125, -6.3507080078125, -5.853271484375, -5.3558349609375, -4.8583984375, -4.3609619140625, -3.863525390625, -3.3660888671875, -2.86865234375, -2.3712158203125, -1.873779296875, -1.3763427734375, -0.87890625, -0.3814697265625, 0.115966796875, 0.6134033203125, 1.11083984375, 1.6082763671875, 2.105712890625, 2.6031494140625, 3.1005859375, 3.5980224609375, 4.095458984375, 4.5928955078125, 5.09033203125, 5.5877685546875, 6.085205078125, 6.5826416015625, 7.080078125, 7.5775146484375, 8.074951171875, 8.5723876953125, 9.06982421875, 9.5672607421875, 10.064697265625, 10.5621337890625, 11.0595703125, 11.5570068359375, 12.054443359375, 12.5518798828125, 13.04931640625, 13.5467529296875, 14.044189453125, 14.5416259765625, 15.0390625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 4.0, 8.0, 12.0, 10.0, 17.0, 24.0, 16.0, 18.0, 23.0, 28.0, 26.0, 24.0, 30.0, 39.0, 39.0, 37.0, 48.0, 38.0, 57.0, 43.0, 45.0, 45.0, 41.0, 44.0, 44.0, 27.0, 29.0, 33.0, 25.0, 20.0, 16.0, 15.0, 16.0, 18.0, 8.0, 12.0, 4.0, 3.0, 2.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.984375, -9.623779296875, -9.26318359375, -8.902587890625, -8.5419921875, -8.181396484375, -7.82080078125, -7.460205078125, -7.099609375, -6.739013671875, -6.37841796875, -6.017822265625, -5.6572265625, -5.296630859375, -4.93603515625, -4.575439453125, -4.21484375, -3.854248046875, -3.49365234375, -3.133056640625, -2.7724609375, -2.411865234375, -2.05126953125, -1.690673828125, -1.330078125, -0.969482421875, -0.60888671875, -0.248291015625, 0.1123046875, 0.472900390625, 0.83349609375, 1.194091796875, 1.5546875, 1.915283203125, 2.27587890625, 2.636474609375, 2.9970703125, 3.357666015625, 3.71826171875, 4.078857421875, 4.439453125, 4.800048828125, 5.16064453125, 5.521240234375, 5.8818359375, 6.242431640625, 6.60302734375, 6.963623046875, 7.32421875, 7.684814453125, 8.04541015625, 8.406005859375, 8.7666015625, 9.127197265625, 9.48779296875, 9.848388671875, 10.208984375, 10.569580078125, 10.93017578125, 11.290771484375, 11.6513671875, 12.011962890625, 12.37255859375, 12.733154296875, 13.09375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 11.0, 13.0, 27.0, 35.0, 39.0, 81.0, 119.0, 184.0, 406.0, 679.0, 1614.0, 4335.0, 14057.0, 52391.0, 192113.0, 396462.0, 270869.0, 82699.0, 21812.0, 6349.0, 2266.0, 911.0, 437.0, 224.0, 140.0, 109.0, 56.0, 33.0, 25.0, 21.0, 12.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.6932373046875, -17.167724609375, -16.6422119140625, -16.11669921875, -15.5911865234375, -15.065673828125, -14.5401611328125, -14.0146484375, -13.4891357421875, -12.963623046875, -12.4381103515625, -11.91259765625, -11.3870849609375, -10.861572265625, -10.3360595703125, -9.810546875, -9.2850341796875, -8.759521484375, -8.2340087890625, -7.70849609375, -7.1829833984375, -6.657470703125, -6.1319580078125, -5.6064453125, -5.0809326171875, -4.555419921875, -4.0299072265625, -3.50439453125, -2.9788818359375, -2.453369140625, -1.9278564453125, -1.40234375, -0.8768310546875, -0.351318359375, 0.1741943359375, 0.69970703125, 1.2252197265625, 1.750732421875, 2.2762451171875, 2.8017578125, 3.3272705078125, 3.852783203125, 4.3782958984375, 4.90380859375, 5.4293212890625, 5.954833984375, 6.4803466796875, 7.005859375, 7.5313720703125, 8.056884765625, 8.5823974609375, 9.10791015625, 9.6334228515625, 10.158935546875, 10.6844482421875, 11.2099609375, 11.7354736328125, 12.260986328125, 12.7864990234375, 13.31201171875, 13.8375244140625, 14.363037109375, 14.8885498046875, 15.4140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 3.0, 9.0, 9.0, 13.0, 13.0, 22.0, 32.0, 27.0, 29.0, 34.0, 40.0, 47.0, 56.0, 57.0, 59.0, 51.0, 47.0, 51.0, 67.0, 46.0, 53.0, 43.0, 37.0, 21.0, 24.0, 14.0, 23.0, 16.0, 12.0, 8.0, 7.0, 2.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007190704345703125, -0.0006963014602661133, -0.0006735324859619141, -0.0006507635116577148, -0.0006279945373535156, -0.0006052255630493164, -0.0005824565887451172, -0.000559687614440918, -0.0005369186401367188, -0.0005141496658325195, -0.0004913806915283203, -0.0004686117172241211, -0.0004458427429199219, -0.00042307376861572266, -0.00040030479431152344, -0.0003775358200073242, -0.000354766845703125, -0.0003319978713989258, -0.00030922889709472656, -0.00028645992279052734, -0.0002636909484863281, -0.0002409219741821289, -0.0002181529998779297, -0.00019538402557373047, -0.00017261505126953125, -0.00014984607696533203, -0.0001270771026611328, -0.0001043081283569336, -8.153915405273438e-05, -5.8770179748535156e-05, -3.600120544433594e-05, -1.3232231140136719e-05, 9.5367431640625e-06, 3.230571746826172e-05, 5.507469177246094e-05, 7.784366607666016e-05, 0.00010061264038085938, 0.0001233816146850586, 0.0001461505889892578, 0.00016891956329345703, 0.00019168853759765625, 0.00021445751190185547, 0.0002372264862060547, 0.0002599954605102539, 0.0002827644348144531, 0.00030553340911865234, 0.00032830238342285156, 0.0003510713577270508, 0.00037384033203125, 0.0003966093063354492, 0.00041937828063964844, 0.00044214725494384766, 0.0004649162292480469, 0.0004876852035522461, 0.0005104541778564453, 0.0005332231521606445, 0.0005559921264648438, 0.000578761100769043, 0.0006015300750732422, 0.0006242990493774414, 0.0006470680236816406, 0.0006698369979858398, 0.0006926059722900391, 0.0007153749465942383, 0.0007381439208984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 7.0, 15.0, 21.0, 21.0, 41.0, 32.0, 58.0, 83.0, 91.0, 161.0, 229.0, 346.0, 519.0, 947.0, 1568.0, 2856.0, 5785.0, 11895.0, 25205.0, 55294.0, 114009.0, 192926.0, 234606.0, 189525.0, 110551.0, 53319.0, 24577.0, 11433.0, 5385.0, 2750.0, 1586.0, 936.0, 559.0, 386.0, 249.0, 162.0, 111.0, 92.0, 62.0, 46.0, 33.0, 23.0, 11.0, 10.0, 12.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-10.3828125, -10.0816650390625, -9.780517578125, -9.4793701171875, -9.17822265625, -8.8770751953125, -8.575927734375, -8.2747802734375, -7.9736328125, -7.6724853515625, -7.371337890625, -7.0701904296875, -6.76904296875, -6.4678955078125, -6.166748046875, -5.8656005859375, -5.564453125, -5.2633056640625, -4.962158203125, -4.6610107421875, -4.35986328125, -4.0587158203125, -3.757568359375, -3.4564208984375, -3.1552734375, -2.8541259765625, -2.552978515625, -2.2518310546875, -1.95068359375, -1.6495361328125, -1.348388671875, -1.0472412109375, -0.74609375, -0.4449462890625, -0.143798828125, 0.1573486328125, 0.45849609375, 0.7596435546875, 1.060791015625, 1.3619384765625, 1.6630859375, 1.9642333984375, 2.265380859375, 2.5665283203125, 2.86767578125, 3.1688232421875, 3.469970703125, 3.7711181640625, 4.072265625, 4.3734130859375, 4.674560546875, 4.9757080078125, 5.27685546875, 5.5780029296875, 5.879150390625, 6.1802978515625, 6.4814453125, 6.7825927734375, 7.083740234375, 7.3848876953125, 7.68603515625, 7.9871826171875, 8.288330078125, 8.5894775390625, 8.890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 13.0, 14.0, 15.0, 26.0, 21.0, 47.0, 52.0, 35.0, 60.0, 82.0, 62.0, 82.0, 82.0, 64.0, 63.0, 62.0, 38.0, 40.0, 28.0, 23.0, 16.0, 11.0, 9.0, 10.0, 6.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.680908203125, -3.57666015625, -3.472412109375, -3.3681640625, -3.263916015625, -3.15966796875, -3.055419921875, -2.951171875, -2.846923828125, -2.74267578125, -2.638427734375, -2.5341796875, -2.429931640625, -2.32568359375, -2.221435546875, -2.1171875, -2.012939453125, -1.90869140625, -1.804443359375, -1.7001953125, -1.595947265625, -1.49169921875, -1.387451171875, -1.283203125, -1.178955078125, -1.07470703125, -0.970458984375, -0.8662109375, -0.761962890625, -0.65771484375, -0.553466796875, -0.44921875, -0.344970703125, -0.24072265625, -0.136474609375, -0.0322265625, 0.072021484375, 0.17626953125, 0.280517578125, 0.384765625, 0.489013671875, 0.59326171875, 0.697509765625, 0.8017578125, 0.906005859375, 1.01025390625, 1.114501953125, 1.21875, 1.322998046875, 1.42724609375, 1.531494140625, 1.6357421875, 1.739990234375, 1.84423828125, 1.948486328125, 2.052734375, 2.156982421875, 2.26123046875, 2.365478515625, 2.4697265625, 2.573974609375, 2.67822265625, 2.782470703125, 2.88671875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 9.0, 9.0, 12.0, 11.0, 19.0, 14.0, 22.0, 38.0, 27.0, 44.0, 44.0, 50.0, 61.0, 60.0, 73.0, 73.0, 61.0, 59.0, 44.0, 49.0, 35.0, 25.0, 35.0, 30.0, 18.0, 26.0, 10.0, 11.0, 7.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.60324478149414, -21.90143585205078, -21.199628829956055, -20.497819900512695, -19.79601287841797, -19.09420394897461, -18.392396926879883, -17.690587997436523, -16.988780975341797, -16.286972045898438, -15.585165023803711, -14.883357048034668, -14.181549072265625, -13.479741096496582, -12.777933120727539, -12.07612419128418, -11.374316215515137, -10.672508239746094, -9.97070026397705, -9.268892288208008, -8.567084312438965, -7.865276336669922, -7.163467884063721, -6.461659908294678, -5.759851932525635, -5.058043956756592, -4.356235980987549, -3.6544277667999268, -2.952619791030884, -2.250811815261841, -1.5490036010742188, -0.8471956253051758, -0.1453876495361328, 0.5564203858375549, 1.2582284212112427, 1.9600365161895752, 2.661844491958618, 3.363652467727661, 4.065460681915283, 4.767268657684326, 5.469076633453369, 6.170884609222412, 6.872692584991455, 7.574501037597656, 8.2763090133667, 8.978116989135742, 9.679924964904785, 10.381732940673828, 11.083540916442871, 11.785348892211914, 12.487156867980957, 13.18896484375, 13.890772819519043, 14.592580795288086, 15.294389724731445, 15.996196746826172, 16.69800567626953, 17.39981460571289, 18.101621627807617, 18.803430557250977, 19.505237579345703, 20.207046508789062, 20.90885353088379, 21.61066246032715, 22.312469482421875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 9.0, 10.0, 14.0, 8.0, 9.0, 19.0, 26.0, 29.0, 28.0, 33.0, 26.0, 30.0, 32.0, 21.0, 36.0, 35.0, 41.0, 26.0, 38.0, 36.0, 36.0, 40.0, 38.0, 37.0, 28.0, 26.0, 41.0, 32.0, 36.0, 14.0, 18.0, 21.0, 11.0, 15.0, 14.0, 12.0, 6.0, 5.0, 7.0, 5.0, 4.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.458547592163086, -13.98674201965332, -13.514936447143555, -13.043129920959473, -12.571324348449707, -12.099518775939941, -11.62771224975586, -11.155906677246094, -10.684101104736328, -10.212295532226562, -9.740489959716797, -9.268683433532715, -8.79687786102295, -8.325072288513184, -7.85326623916626, -7.381460189819336, -6.90965461730957, -6.437849044799805, -5.966042995452881, -5.494236946105957, -5.022431373596191, -4.550625801086426, -4.078819751739502, -3.6070139408111572, -3.1352081298828125, -2.6634023189544678, -2.191596508026123, -1.7197906970977783, -1.2479848861694336, -0.7761790752410889, -0.30437326431274414, 0.16743254661560059, 0.6392393112182617, 1.1110451221466064, 1.5828509330749512, 2.054656744003296, 2.5264625549316406, 2.9982683658599854, 3.47007417678833, 3.941879987716675, 4.4136857986450195, 4.885491371154785, 5.357297420501709, 5.829103469848633, 6.300909042358398, 6.772714614868164, 7.244520664215088, 7.716326713562012, 8.188132286071777, 8.659937858581543, 9.131744384765625, 9.60354995727539, 10.075355529785156, 10.547161102294922, 11.018966674804688, 11.49077320098877, 11.962578773498535, 12.4343843460083, 12.906190872192383, 13.377996444702148, 13.849802017211914, 14.32160758972168, 14.793413162231445, 15.265219688415527, 15.737025260925293]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 2.0, 4.0, 11.0, 16.0, 20.0, 39.0, 57.0, 88.0, 140.0, 228.0, 310.0, 496.0, 789.0, 1248.0, 2121.0, 3385.0, 5542.0, 9091.0, 15171.0, 25820.0, 44833.0, 77748.0, 137315.0, 234872.0, 382726.0, 557524.0, 677968.0, 659385.0, 518410.0, 345413.0, 209379.0, 120248.0, 68883.0, 39388.0, 22705.0, 13197.0, 7818.0, 4640.0, 2802.0, 1664.0, 1058.0, 652.0, 397.0, 261.0, 145.0, 107.0, 75.0, 38.0, 21.0, 20.0, 10.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.85986328125, -15.3291015625, -14.79833984375, -14.267578125, -13.73681640625, -13.2060546875, -12.67529296875, -12.14453125, -11.61376953125, -11.0830078125, -10.55224609375, -10.021484375, -9.49072265625, -8.9599609375, -8.42919921875, -7.8984375, -7.36767578125, -6.8369140625, -6.30615234375, -5.775390625, -5.24462890625, -4.7138671875, -4.18310546875, -3.65234375, -3.12158203125, -2.5908203125, -2.06005859375, -1.529296875, -0.99853515625, -0.4677734375, 0.06298828125, 0.59375, 1.12451171875, 1.6552734375, 2.18603515625, 2.716796875, 3.24755859375, 3.7783203125, 4.30908203125, 4.83984375, 5.37060546875, 5.9013671875, 6.43212890625, 6.962890625, 7.49365234375, 8.0244140625, 8.55517578125, 9.0859375, 9.61669921875, 10.1474609375, 10.67822265625, 11.208984375, 11.73974609375, 12.2705078125, 12.80126953125, 13.33203125, 13.86279296875, 14.3935546875, 14.92431640625, 15.455078125, 15.98583984375, 16.5166015625, 17.04736328125, 17.578125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 10.0, 4.0, 10.0, 16.0, 7.0, 8.0, 21.0, 23.0, 25.0, 35.0, 29.0, 27.0, 26.0, 25.0, 29.0, 44.0, 35.0, 30.0, 29.0, 36.0, 41.0, 27.0, 38.0, 33.0, 46.0, 29.0, 26.0, 30.0, 38.0, 29.0, 23.0, 17.0, 17.0, 16.0, 19.0, 15.0, 11.0, 5.0, 8.0, 6.0, 4.0, 6.0, 8.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.09375, -11.690185546875, -11.28662109375, -10.883056640625, -10.4794921875, -10.075927734375, -9.67236328125, -9.268798828125, -8.865234375, -8.461669921875, -8.05810546875, -7.654541015625, -7.2509765625, -6.847412109375, -6.44384765625, -6.040283203125, -5.63671875, -5.233154296875, -4.82958984375, -4.426025390625, -4.0224609375, -3.618896484375, -3.21533203125, -2.811767578125, -2.408203125, -2.004638671875, -1.60107421875, -1.197509765625, -0.7939453125, -0.390380859375, 0.01318359375, 0.416748046875, 0.8203125, 1.223876953125, 1.62744140625, 2.031005859375, 2.4345703125, 2.838134765625, 3.24169921875, 3.645263671875, 4.048828125, 4.452392578125, 4.85595703125, 5.259521484375, 5.6630859375, 6.066650390625, 6.47021484375, 6.873779296875, 7.27734375, 7.680908203125, 8.08447265625, 8.488037109375, 8.8916015625, 9.295166015625, 9.69873046875, 10.102294921875, 10.505859375, 10.909423828125, 11.31298828125, 11.716552734375, 12.1201171875, 12.523681640625, 12.92724609375, 13.330810546875, 13.734375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 11.0, 21.0, 31.0, 60.0, 107.0, 151.0, 221.0, 383.0, 634.0, 1005.0, 1647.0, 2754.0, 4331.0, 7362.0, 12546.0, 20359.0, 33762.0, 56243.0, 92689.0, 149945.0, 235292.0, 350121.0, 475838.0, 569847.0, 583676.0, 506067.0, 385036.0, 264482.0, 170672.0, 106874.0, 64664.0, 38487.0, 23201.0, 14082.0, 8570.0, 5006.0, 3216.0, 1902.0, 1173.0, 709.0, 440.0, 244.0, 164.0, 114.0, 61.0, 29.0, 19.0, 10.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-17.65625, -17.1390380859375, -16.621826171875, -16.1046142578125, -15.58740234375, -15.0701904296875, -14.552978515625, -14.0357666015625, -13.5185546875, -13.0013427734375, -12.484130859375, -11.9669189453125, -11.44970703125, -10.9324951171875, -10.415283203125, -9.8980712890625, -9.380859375, -8.8636474609375, -8.346435546875, -7.8292236328125, -7.31201171875, -6.7947998046875, -6.277587890625, -5.7603759765625, -5.2431640625, -4.7259521484375, -4.208740234375, -3.6915283203125, -3.17431640625, -2.6571044921875, -2.139892578125, -1.6226806640625, -1.10546875, -0.5882568359375, -0.071044921875, 0.4461669921875, 0.96337890625, 1.4805908203125, 1.997802734375, 2.5150146484375, 3.0322265625, 3.5494384765625, 4.066650390625, 4.5838623046875, 5.10107421875, 5.6182861328125, 6.135498046875, 6.6527099609375, 7.169921875, 7.6871337890625, 8.204345703125, 8.7215576171875, 9.23876953125, 9.7559814453125, 10.273193359375, 10.7904052734375, 11.3076171875, 11.8248291015625, 12.342041015625, 12.8592529296875, 13.37646484375, 13.8936767578125, 14.410888671875, 14.9281005859375, 15.4453125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 2.0, 11.0, 10.0, 12.0, 20.0, 23.0, 33.0, 41.0, 44.0, 56.0, 69.0, 87.0, 103.0, 124.0, 123.0, 141.0, 164.0, 159.0, 186.0, 180.0, 191.0, 202.0, 219.0, 192.0, 212.0, 195.0, 164.0, 167.0, 142.0, 139.0, 116.0, 109.0, 83.0, 53.0, 65.0, 55.0, 40.0, 34.0, 25.0, 21.0, 19.0, 12.0, 10.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.6546630859375, -5.446044921875, -5.2374267578125, -5.02880859375, -4.8201904296875, -4.611572265625, -4.4029541015625, -4.1943359375, -3.9857177734375, -3.777099609375, -3.5684814453125, -3.35986328125, -3.1512451171875, -2.942626953125, -2.7340087890625, -2.525390625, -2.3167724609375, -2.108154296875, -1.8995361328125, -1.69091796875, -1.4822998046875, -1.273681640625, -1.0650634765625, -0.8564453125, -0.6478271484375, -0.439208984375, -0.2305908203125, -0.02197265625, 0.1866455078125, 0.395263671875, 0.6038818359375, 0.8125, 1.0211181640625, 1.229736328125, 1.4383544921875, 1.64697265625, 1.8555908203125, 2.064208984375, 2.2728271484375, 2.4814453125, 2.6900634765625, 2.898681640625, 3.1072998046875, 3.31591796875, 3.5245361328125, 3.733154296875, 3.9417724609375, 4.150390625, 4.3590087890625, 4.567626953125, 4.7762451171875, 4.98486328125, 5.1934814453125, 5.402099609375, 5.6107177734375, 5.8193359375, 6.0279541015625, 6.236572265625, 6.4451904296875, 6.65380859375, 6.8624267578125, 7.071044921875, 7.2796630859375, 7.48828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 10.0, 10.0, 12.0, 13.0, 19.0, 17.0, 24.0, 16.0, 24.0, 38.0, 37.0, 37.0, 42.0, 42.0, 45.0, 39.0, 48.0, 56.0, 45.0, 40.0, 54.0, 52.0, 39.0, 38.0, 26.0, 21.0, 28.0, 21.0, 17.0, 9.0, 12.0, 15.0, 10.0, 6.0, 9.0, 5.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.023977279663086, -18.460514068603516, -17.897050857543945, -17.333587646484375, -16.770122528076172, -16.2066593170166, -15.643196105957031, -15.079732894897461, -14.51626968383789, -13.95280647277832, -13.38934326171875, -12.825879096984863, -12.262415885925293, -11.698952674865723, -11.135488510131836, -10.572025299072266, -10.008562088012695, -9.445098876953125, -8.881635665893555, -8.318171501159668, -7.754708290100098, -7.191245079040527, -6.627781391143799, -6.06431770324707, -5.5008544921875, -4.93739128112793, -4.373927593231201, -3.8104641437530518, -3.2470006942749023, -2.683537244796753, -2.1200737953186035, -1.556610345840454, -0.9931449890136719, -0.42968153953552246, 0.13378190994262695, 0.6972453594207764, 1.2607088088989258, 1.8241722583770752, 2.3876357078552246, 2.951099157333374, 3.5145626068115234, 4.078025817871094, 4.641489505767822, 5.204953193664551, 5.768416404724121, 6.331879615783691, 6.89534330368042, 7.458806991577148, 8.022270202636719, 8.585733413696289, 9.14919662475586, 9.712660789489746, 10.276124000549316, 10.839587211608887, 11.403051376342773, 11.966514587402344, 12.529977798461914, 13.093441009521484, 13.656904220581055, 14.220368385314941, 14.783831596374512, 15.347294807434082, 15.910758972167969, 16.47422218322754, 17.03768539428711]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 0.0, 6.0, 5.0, 4.0, 18.0, 13.0, 14.0, 16.0, 19.0, 17.0, 17.0, 27.0, 28.0, 34.0, 29.0, 39.0, 31.0, 44.0, 36.0, 43.0, 29.0, 30.0, 37.0, 48.0, 28.0, 52.0, 49.0, 31.0, 27.0, 31.0, 21.0, 29.0, 30.0, 19.0, 20.0, 15.0, 17.0, 12.0, 10.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.063995361328125, -15.55224609375, -15.040496826171875, -14.52874755859375, -14.016997337341309, -13.505248069763184, -12.993498802185059, -12.481749534606934, -11.969999313354492, -11.458250045776367, -10.946500778198242, -10.434751510620117, -9.923001289367676, -9.41125202178955, -8.899502754211426, -8.3877534866333, -7.876004219055176, -7.364254951477051, -6.852505207061768, -6.340755939483643, -5.829006195068359, -5.317256927490234, -4.805507659912109, -4.293758392333984, -3.782008647918701, -3.270259141921997, -2.758509635925293, -2.246760368347168, -1.7350108623504639, -1.2232613563537598, -0.7115120887756348, -0.19976258277893066, 0.31198692321777344, 0.8237363696098328, 1.335485816001892, 1.8472352027893066, 2.3589847087860107, 2.870734214782715, 3.38248348236084, 3.894232988357544, 4.405982494354248, 4.917731761932373, 5.429481506347656, 5.941230773925781, 6.452980041503906, 6.9647297859191895, 7.4764790534973145, 7.988228797912598, 8.499978065490723, 9.011727333068848, 9.523476600646973, 10.035226821899414, 10.546976089477539, 11.058725357055664, 11.570474624633789, 12.082223892211914, 12.593973159790039, 13.105722427368164, 13.617471694946289, 14.129220962524414, 14.640971183776855, 15.15272045135498, 15.664469718933105, 16.176219940185547, 16.687969207763672]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 9.0, 11.0, 17.0, 23.0, 41.0, 59.0, 96.0, 153.0, 222.0, 389.0, 550.0, 777.0, 1295.0, 1889.0, 2921.0, 4461.0, 6301.0, 9243.0, 13621.0, 19382.0, 27045.0, 37338.0, 49335.0, 63444.0, 77593.0, 90373.0, 97928.0, 99175.0, 93690.0, 82764.0, 69304.0, 55081.0, 41819.0, 30902.0, 22062.0, 15432.0, 11044.0, 7479.0, 5049.0, 3511.0, 2325.0, 1546.0, 996.0, 621.0, 429.0, 280.0, 170.0, 125.0, 93.0, 57.0, 34.0, 16.0, 17.0, 12.0, 9.0, 9.0, 1.0, 0.0, 3.0], "bins": [-4.6640625, -4.51922607421875, -4.3743896484375, -4.22955322265625, -4.084716796875, -3.93988037109375, -3.7950439453125, -3.65020751953125, -3.50537109375, -3.36053466796875, -3.2156982421875, -3.07086181640625, -2.926025390625, -2.78118896484375, -2.6363525390625, -2.49151611328125, -2.3466796875, -2.20184326171875, -2.0570068359375, -1.91217041015625, -1.767333984375, -1.62249755859375, -1.4776611328125, -1.33282470703125, -1.18798828125, -1.04315185546875, -0.8983154296875, -0.75347900390625, -0.608642578125, -0.46380615234375, -0.3189697265625, -0.17413330078125, -0.029296875, 0.11553955078125, 0.2603759765625, 0.40521240234375, 0.550048828125, 0.69488525390625, 0.8397216796875, 0.98455810546875, 1.12939453125, 1.27423095703125, 1.4190673828125, 1.56390380859375, 1.708740234375, 1.85357666015625, 1.9984130859375, 2.14324951171875, 2.2880859375, 2.43292236328125, 2.5777587890625, 2.72259521484375, 2.867431640625, 3.01226806640625, 3.1571044921875, 3.30194091796875, 3.44677734375, 3.59161376953125, 3.7364501953125, 3.88128662109375, 4.026123046875, 4.17095947265625, 4.3157958984375, 4.46063232421875, 4.60546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 6.0, 5.0, 5.0, 17.0, 14.0, 11.0, 18.0, 20.0, 16.0, 20.0, 21.0, 32.0, 33.0, 32.0, 34.0, 33.0, 44.0, 38.0, 40.0, 31.0, 30.0, 37.0, 47.0, 30.0, 49.0, 44.0, 32.0, 32.0, 31.0, 21.0, 31.0, 29.0, 17.0, 21.0, 13.0, 20.0, 12.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.171875, -15.656982421875, -15.14208984375, -14.627197265625, -14.1123046875, -13.597412109375, -13.08251953125, -12.567626953125, -12.052734375, -11.537841796875, -11.02294921875, -10.508056640625, -9.9931640625, -9.478271484375, -8.96337890625, -8.448486328125, -7.93359375, -7.418701171875, -6.90380859375, -6.388916015625, -5.8740234375, -5.359130859375, -4.84423828125, -4.329345703125, -3.814453125, -3.299560546875, -2.78466796875, -2.269775390625, -1.7548828125, -1.239990234375, -0.72509765625, -0.210205078125, 0.3046875, 0.819580078125, 1.33447265625, 1.849365234375, 2.3642578125, 2.879150390625, 3.39404296875, 3.908935546875, 4.423828125, 4.938720703125, 5.45361328125, 5.968505859375, 6.4833984375, 6.998291015625, 7.51318359375, 8.028076171875, 8.54296875, 9.057861328125, 9.57275390625, 10.087646484375, 10.6025390625, 11.117431640625, 11.63232421875, 12.147216796875, 12.662109375, 13.177001953125, 13.69189453125, 14.206787109375, 14.7216796875, 15.236572265625, 15.75146484375, 16.266357421875, 16.78125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 8.0, 17.0, 28.0, 37.0, 66.0, 85.0, 155.0, 284.0, 518.0, 968.0, 1943.0, 4035.0, 7929.0, 16254.0, 35686.0, 750460.0, 175384.0, 28261.0, 13204.0, 6515.0, 3228.0, 1572.0, 809.0, 470.0, 243.0, 149.0, 81.0, 53.0, 32.0, 18.0, 20.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.671875, -22.951416015625, -22.23095703125, -21.510498046875, -20.7900390625, -20.069580078125, -19.34912109375, -18.628662109375, -17.908203125, -17.187744140625, -16.46728515625, -15.746826171875, -15.0263671875, -14.305908203125, -13.58544921875, -12.864990234375, -12.14453125, -11.424072265625, -10.70361328125, -9.983154296875, -9.2626953125, -8.542236328125, -7.82177734375, -7.101318359375, -6.380859375, -5.660400390625, -4.93994140625, -4.219482421875, -3.4990234375, -2.778564453125, -2.05810546875, -1.337646484375, -0.6171875, 0.103271484375, 0.82373046875, 1.544189453125, 2.2646484375, 2.985107421875, 3.70556640625, 4.426025390625, 5.146484375, 5.866943359375, 6.58740234375, 7.307861328125, 8.0283203125, 8.748779296875, 9.46923828125, 10.189697265625, 10.91015625, 11.630615234375, 12.35107421875, 13.071533203125, 13.7919921875, 14.512451171875, 15.23291015625, 15.953369140625, 16.673828125, 17.394287109375, 18.11474609375, 18.835205078125, 19.5556640625, 20.276123046875, 20.99658203125, 21.717041015625, 22.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 9.0, 5.0, 10.0, 8.0, 18.0, 14.0, 17.0, 19.0, 11.0, 24.0, 24.0, 28.0, 28.0, 38.0, 24.0, 34.0, 34.0, 42.0, 40.0, 43.0, 36.0, 40.0, 29.0, 37.0, 35.0, 39.0, 33.0, 34.0, 34.0, 17.0, 18.0, 31.0, 17.0, 22.0, 15.0, 15.0, 19.0, 13.0, 12.0, 7.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.78125, -10.4539794921875, -10.126708984375, -9.7994384765625, -9.47216796875, -9.1448974609375, -8.817626953125, -8.4903564453125, -8.1630859375, -7.8358154296875, -7.508544921875, -7.1812744140625, -6.85400390625, -6.5267333984375, -6.199462890625, -5.8721923828125, -5.544921875, -5.2176513671875, -4.890380859375, -4.5631103515625, -4.23583984375, -3.9085693359375, -3.581298828125, -3.2540283203125, -2.9267578125, -2.5994873046875, -2.272216796875, -1.9449462890625, -1.61767578125, -1.2904052734375, -0.963134765625, -0.6358642578125, -0.30859375, 0.0186767578125, 0.345947265625, 0.6732177734375, 1.00048828125, 1.3277587890625, 1.655029296875, 1.9822998046875, 2.3095703125, 2.6368408203125, 2.964111328125, 3.2913818359375, 3.61865234375, 3.9459228515625, 4.273193359375, 4.6004638671875, 4.927734375, 5.2550048828125, 5.582275390625, 5.9095458984375, 6.23681640625, 6.5640869140625, 6.891357421875, 7.2186279296875, 7.5458984375, 7.8731689453125, 8.200439453125, 8.5277099609375, 8.85498046875, 9.1822509765625, 9.509521484375, 9.8367919921875, 10.1640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 3.0, 8.0, 11.0, 15.0, 18.0, 23.0, 38.0, 53.0, 70.0, 115.0, 143.0, 188.0, 276.0, 407.0, 655.0, 962.0, 1571.0, 2488.0, 4240.0, 7146.0, 12855.0, 25106.0, 92749.0, 804474.0, 47792.0, 20306.0, 10771.0, 6077.0, 3668.0, 2277.0, 1375.0, 867.0, 538.0, 372.0, 262.0, 173.0, 127.0, 96.0, 52.0, 48.0, 33.0, 25.0, 20.0, 11.0, 10.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.97802734375, -0.9468307495117188, -0.9156341552734375, -0.8844375610351562, -0.853240966796875, -0.8220443725585938, -0.7908477783203125, -0.7596511840820312, -0.72845458984375, -0.6972579956054688, -0.6660614013671875, -0.6348648071289062, -0.603668212890625, -0.5724716186523438, -0.5412750244140625, -0.5100784301757812, -0.4788818359375, -0.44768524169921875, -0.4164886474609375, -0.38529205322265625, -0.354095458984375, -0.32289886474609375, -0.2917022705078125, -0.26050567626953125, -0.22930908203125, -0.19811248779296875, -0.1669158935546875, -0.13571929931640625, -0.104522705078125, -0.07332611083984375, -0.0421295166015625, -0.01093292236328125, 0.020263671875, 0.05146026611328125, 0.0826568603515625, 0.11385345458984375, 0.145050048828125, 0.17624664306640625, 0.2074432373046875, 0.23863983154296875, 0.26983642578125, 0.30103302001953125, 0.3322296142578125, 0.36342620849609375, 0.394622802734375, 0.42581939697265625, 0.4570159912109375, 0.48821258544921875, 0.5194091796875, 0.5506057739257812, 0.5818023681640625, 0.6129989624023438, 0.644195556640625, 0.6753921508789062, 0.7065887451171875, 0.7377853393554688, 0.76898193359375, 0.8001785278320312, 0.8313751220703125, 0.8625717163085938, 0.893768310546875, 0.9249649047851562, 0.9561614990234375, 0.9873580932617188, 1.0185546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 7.0, 4.0, 9.0, 10.0, 19.0, 26.0, 35.0, 33.0, 56.0, 60.0, 102.0, 101.0, 84.0, 94.0, 72.0, 58.0, 57.0, 40.0, 34.0, 23.0, 22.0, 13.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021910667419433594, -0.00021193921566009521, -0.0002047717571258545, -0.00019760429859161377, -0.00019043684005737305, -0.00018326938152313232, -0.0001761019229888916, -0.00016893446445465088, -0.00016176700592041016, -0.00015459954738616943, -0.0001474320888519287, -0.000140264630317688, -0.00013309717178344727, -0.00012592971324920654, -0.00011876225471496582, -0.0001115947961807251, -0.00010442733764648438, -9.725987911224365e-05, -9.009242057800293e-05, -8.292496204376221e-05, -7.575750350952148e-05, -6.859004497528076e-05, -6.142258644104004e-05, -5.4255127906799316e-05, -4.7087669372558594e-05, -3.992021083831787e-05, -3.275275230407715e-05, -2.5585293769836426e-05, -1.8417835235595703e-05, -1.125037670135498e-05, -4.082918167114258e-06, 3.084540367126465e-06, 1.0251998901367188e-05, 1.741945743560791e-05, 2.4586915969848633e-05, 3.1754374504089355e-05, 3.892183303833008e-05, 4.60892915725708e-05, 5.3256750106811523e-05, 6.0424208641052246e-05, 6.759166717529297e-05, 7.475912570953369e-05, 8.192658424377441e-05, 8.909404277801514e-05, 9.626150131225586e-05, 0.00010342895984649658, 0.0001105964183807373, 0.00011776387691497803, 0.00012493133544921875, 0.00013209879398345947, 0.0001392662525177002, 0.00014643371105194092, 0.00015360116958618164, 0.00016076862812042236, 0.00016793608665466309, 0.0001751035451889038, 0.00018227100372314453, 0.00018943846225738525, 0.00019660592079162598, 0.0002037733793258667, 0.00021094083786010742, 0.00021810829639434814, 0.00022527575492858887, 0.0002324432134628296, 0.0002396106719970703]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 10.0, 10.0, 13.0, 31.0, 33.0, 34.0, 48.0, 77.0, 102.0, 144.0, 181.0, 290.0, 382.0, 559.0, 810.0, 1402.0, 2237.0, 3910.0, 6982.0, 13569.0, 25767.0, 48526.0, 86517.0, 136475.0, 179999.0, 183399.0, 145286.0, 94333.0, 54310.0, 29001.0, 15143.0, 7851.0, 4389.0, 2332.0, 1429.0, 938.0, 600.0, 436.0, 284.0, 171.0, 157.0, 107.0, 76.0, 56.0, 41.0, 21.0, 29.0, 16.0, 11.0, 9.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7923812866210938, -0.7668914794921875, -0.7414016723632812, -0.715911865234375, -0.6904220581054688, -0.6649322509765625, -0.6394424438476562, -0.61395263671875, -0.5884628295898438, -0.5629730224609375, -0.5374832153320312, -0.511993408203125, -0.48650360107421875, -0.4610137939453125, -0.43552398681640625, -0.4100341796875, -0.38454437255859375, -0.3590545654296875, -0.33356475830078125, -0.308074951171875, -0.28258514404296875, -0.2570953369140625, -0.23160552978515625, -0.20611572265625, -0.18062591552734375, -0.1551361083984375, -0.12964630126953125, -0.104156494140625, -0.07866668701171875, -0.0531768798828125, -0.02768707275390625, -0.002197265625, 0.02329254150390625, 0.0487823486328125, 0.07427215576171875, 0.099761962890625, 0.12525177001953125, 0.1507415771484375, 0.17623138427734375, 0.20172119140625, 0.22721099853515625, 0.2527008056640625, 0.27819061279296875, 0.303680419921875, 0.32917022705078125, 0.3546600341796875, 0.38014984130859375, 0.4056396484375, 0.43112945556640625, 0.4566192626953125, 0.48210906982421875, 0.507598876953125, 0.5330886840820312, 0.5585784912109375, 0.5840682983398438, 0.60955810546875, 0.6350479125976562, 0.6605377197265625, 0.6860275268554688, 0.711517333984375, 0.7370071411132812, 0.7624969482421875, 0.7879867553710938, 0.8134765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 9.0, 7.0, 17.0, 11.0, 23.0, 21.0, 32.0, 38.0, 46.0, 42.0, 51.0, 52.0, 65.0, 47.0, 51.0, 52.0, 53.0, 35.0, 51.0, 39.0, 41.0, 35.0, 36.0, 27.0, 24.0, 18.0, 19.0, 12.0, 12.0, 8.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29443359375, -0.2855873107910156, -0.27674102783203125, -0.2678947448730469, -0.2590484619140625, -0.2502021789550781, -0.24135589599609375, -0.23250961303710938, -0.223663330078125, -0.21481704711914062, -0.20597076416015625, -0.19712448120117188, -0.1882781982421875, -0.17943191528320312, -0.17058563232421875, -0.16173934936523438, -0.15289306640625, -0.14404678344726562, -0.13520050048828125, -0.12635421752929688, -0.1175079345703125, -0.10866165161132812, -0.09981536865234375, -0.09096908569335938, -0.082122802734375, -0.07327651977539062, -0.06443023681640625, -0.055583953857421875, -0.0467376708984375, -0.037891387939453125, -0.02904510498046875, -0.020198822021484375, -0.0113525390625, -0.002506256103515625, 0.00634002685546875, 0.015186309814453125, 0.0240325927734375, 0.032878875732421875, 0.04172515869140625, 0.050571441650390625, 0.059417724609375, 0.06826400756835938, 0.07711029052734375, 0.08595657348632812, 0.0948028564453125, 0.10364913940429688, 0.11249542236328125, 0.12134170532226562, 0.13018798828125, 0.13903427124023438, 0.14788055419921875, 0.15672683715820312, 0.1655731201171875, 0.17441940307617188, 0.18326568603515625, 0.19211196899414062, 0.200958251953125, 0.20980453491210938, 0.21865081787109375, 0.22749710083007812, 0.2363433837890625, 0.24518966674804688, 0.25403594970703125, 0.2628822326660156, 0.271728515625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 6.0, 3.0, 8.0, 14.0, 13.0, 13.0, 10.0, 27.0, 20.0, 18.0, 27.0, 30.0, 32.0, 47.0, 51.0, 38.0, 55.0, 35.0, 50.0, 45.0, 60.0, 58.0, 44.0, 55.0, 36.0, 32.0, 24.0, 28.0, 23.0, 23.0, 9.0, 13.0, 11.0, 14.0, 7.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.3533992767334, -20.755352020263672, -20.157302856445312, -19.559255599975586, -18.96120834350586, -18.3631591796875, -17.765111923217773, -17.167064666748047, -16.569015502929688, -15.970967292785645, -15.372920036315918, -14.774871826171875, -14.176823616027832, -13.578775405883789, -12.980728149414062, -12.38267993927002, -11.784632682800293, -11.18658447265625, -10.588537216186523, -9.99048900604248, -9.392440795898438, -8.794393539428711, -8.196345329284668, -7.598297119140625, -7.00024938583374, -6.4022016525268555, -5.8041534423828125, -5.206105709075928, -4.608057975769043, -4.010009765625, -3.4119620323181152, -2.8139138221740723, -2.2158660888671875, -1.6178181171417236, -1.0197702646255493, -0.421722412109375, 0.17632555961608887, 0.7743735313415527, 1.3724212646484375, 1.9704694747924805, 2.5685172080993652, 3.166565179824829, 3.764613151550293, 4.362660884857178, 4.9607086181640625, 5.5587568283081055, 6.15680456161499, 6.754852771759033, 7.352900505065918, 7.950948238372803, 8.548995971679688, 9.14704418182373, 9.745092391967773, 10.3431396484375, 10.941187858581543, 11.539236068725586, 12.137283325195312, 12.735331535339355, 13.333378791809082, 13.931427001953125, 14.529475212097168, 15.127523422241211, 15.725570678710938, 16.323619842529297, 16.921667098999023]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 7.0, 2.0, 1.0, 6.0, 4.0, 6.0, 18.0, 14.0, 8.0, 20.0, 21.0, 14.0, 15.0, 24.0, 34.0, 33.0, 28.0, 35.0, 34.0, 44.0, 36.0, 37.0, 39.0, 28.0, 37.0, 46.0, 31.0, 44.0, 47.0, 33.0, 33.0, 31.0, 20.0, 28.0, 30.0, 22.0, 19.0, 10.0, 23.0, 13.0, 9.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.204660415649414, -15.690380096435547, -15.17609977722168, -14.661819458007812, -14.147539138793945, -13.633258819580078, -13.118978500366211, -12.604698181152344, -12.090417861938477, -11.57613754272461, -11.061857223510742, -10.547576904296875, -10.033296585083008, -9.51901626586914, -9.004735946655273, -8.490455627441406, -7.976175308227539, -7.461894989013672, -6.947614669799805, -6.4333343505859375, -5.91905403137207, -5.404773712158203, -4.890493392944336, -4.376213073730469, -3.8619327545166016, -3.3476524353027344, -2.833372116088867, -2.319091796875, -1.8048114776611328, -1.2905311584472656, -0.7762508392333984, -0.26197052001953125, 0.25230979919433594, 0.7665901184082031, 1.2808704376220703, 1.7951507568359375, 2.3094310760498047, 2.823711395263672, 3.337991714477539, 3.8522720336914062, 4.366552352905273, 4.880832672119141, 5.395112991333008, 5.909393310546875, 6.423673629760742, 6.937953948974609, 7.452234268188477, 7.966514587402344, 8.480794906616211, 8.995075225830078, 9.509355545043945, 10.023635864257812, 10.53791618347168, 11.052196502685547, 11.566476821899414, 12.080757141113281, 12.595037460327148, 13.109317779541016, 13.623598098754883, 14.13787841796875, 14.652158737182617, 15.166439056396484, 15.680719375610352, 16.19499969482422, 16.709280014038086]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 11.0, 9.0, 22.0, 33.0, 53.0, 81.0, 117.0, 215.0, 383.0, 537.0, 950.0, 1502.0, 2551.0, 4239.0, 6698.0, 11146.0, 17785.0, 27206.0, 40594.0, 58267.0, 78402.0, 98621.0, 113396.0, 119100.0, 113651.0, 99319.0, 78884.0, 58459.0, 41349.0, 27661.0, 18069.0, 11292.0, 7009.0, 4202.0, 2679.0, 1595.0, 956.0, 564.0, 351.0, 224.0, 152.0, 89.0, 38.0, 31.0, 23.0, 10.0, 7.0, 9.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-15.5234375, -15.060302734375, -14.59716796875, -14.134033203125, -13.6708984375, -13.207763671875, -12.74462890625, -12.281494140625, -11.818359375, -11.355224609375, -10.89208984375, -10.428955078125, -9.9658203125, -9.502685546875, -9.03955078125, -8.576416015625, -8.11328125, -7.650146484375, -7.18701171875, -6.723876953125, -6.2607421875, -5.797607421875, -5.33447265625, -4.871337890625, -4.408203125, -3.945068359375, -3.48193359375, -3.018798828125, -2.5556640625, -2.092529296875, -1.62939453125, -1.166259765625, -0.703125, -0.239990234375, 0.22314453125, 0.686279296875, 1.1494140625, 1.612548828125, 2.07568359375, 2.538818359375, 3.001953125, 3.465087890625, 3.92822265625, 4.391357421875, 4.8544921875, 5.317626953125, 5.78076171875, 6.243896484375, 6.70703125, 7.170166015625, 7.63330078125, 8.096435546875, 8.5595703125, 9.022705078125, 9.48583984375, 9.948974609375, 10.412109375, 10.875244140625, 11.33837890625, 11.801513671875, 12.2646484375, 12.727783203125, 13.19091796875, 13.654052734375, 14.1171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 7.0, 4.0, 5.0, 20.0, 13.0, 6.0, 24.0, 19.0, 16.0, 14.0, 27.0, 30.0, 32.0, 31.0, 29.0, 39.0, 45.0, 37.0, 35.0, 39.0, 28.0, 36.0, 44.0, 32.0, 45.0, 47.0, 36.0, 29.0, 31.0, 17.0, 28.0, 34.0, 20.0, 20.0, 12.0, 17.0, 15.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.421875, -14.93212890625, -14.4423828125, -13.95263671875, -13.462890625, -12.97314453125, -12.4833984375, -11.99365234375, -11.50390625, -11.01416015625, -10.5244140625, -10.03466796875, -9.544921875, -9.05517578125, -8.5654296875, -8.07568359375, -7.5859375, -7.09619140625, -6.6064453125, -6.11669921875, -5.626953125, -5.13720703125, -4.6474609375, -4.15771484375, -3.66796875, -3.17822265625, -2.6884765625, -2.19873046875, -1.708984375, -1.21923828125, -0.7294921875, -0.23974609375, 0.25, 0.73974609375, 1.2294921875, 1.71923828125, 2.208984375, 2.69873046875, 3.1884765625, 3.67822265625, 4.16796875, 4.65771484375, 5.1474609375, 5.63720703125, 6.126953125, 6.61669921875, 7.1064453125, 7.59619140625, 8.0859375, 8.57568359375, 9.0654296875, 9.55517578125, 10.044921875, 10.53466796875, 11.0244140625, 11.51416015625, 12.00390625, 12.49365234375, 12.9833984375, 13.47314453125, 13.962890625, 14.45263671875, 14.9423828125, 15.43212890625, 15.921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 17.0, 18.0, 22.0, 49.0, 91.0, 122.0, 223.0, 316.0, 483.0, 763.0, 1211.0, 1841.0, 3014.0, 4571.0, 6878.0, 10774.0, 16021.0, 23547.0, 33993.0, 47444.0, 62228.0, 78737.0, 92586.0, 102971.0, 105551.0, 100995.0, 88504.0, 73181.0, 57056.0, 42618.0, 30872.0, 21105.0, 14290.0, 9276.0, 6110.0, 4039.0, 2498.0, 1657.0, 1057.0, 643.0, 404.0, 288.0, 190.0, 94.0, 70.0, 58.0, 26.0, 26.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.296875, -11.8916015625, -11.486328125, -11.0810546875, -10.67578125, -10.2705078125, -9.865234375, -9.4599609375, -9.0546875, -8.6494140625, -8.244140625, -7.8388671875, -7.43359375, -7.0283203125, -6.623046875, -6.2177734375, -5.8125, -5.4072265625, -5.001953125, -4.5966796875, -4.19140625, -3.7861328125, -3.380859375, -2.9755859375, -2.5703125, -2.1650390625, -1.759765625, -1.3544921875, -0.94921875, -0.5439453125, -0.138671875, 0.2666015625, 0.671875, 1.0771484375, 1.482421875, 1.8876953125, 2.29296875, 2.6982421875, 3.103515625, 3.5087890625, 3.9140625, 4.3193359375, 4.724609375, 5.1298828125, 5.53515625, 5.9404296875, 6.345703125, 6.7509765625, 7.15625, 7.5615234375, 7.966796875, 8.3720703125, 8.77734375, 9.1826171875, 9.587890625, 9.9931640625, 10.3984375, 10.8037109375, 11.208984375, 11.6142578125, 12.01953125, 12.4248046875, 12.830078125, 13.2353515625, 13.640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 9.0, 6.0, 10.0, 14.0, 6.0, 8.0, 14.0, 12.0, 23.0, 23.0, 29.0, 27.0, 27.0, 24.0, 23.0, 28.0, 41.0, 39.0, 32.0, 35.0, 35.0, 51.0, 45.0, 36.0, 41.0, 47.0, 28.0, 37.0, 33.0, 33.0, 28.0, 22.0, 26.0, 22.0, 18.0, 13.0, 10.0, 11.0, 14.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.0777587890625, -9.757080078125, -9.4364013671875, -9.11572265625, -8.7950439453125, -8.474365234375, -8.1536865234375, -7.8330078125, -7.5123291015625, -7.191650390625, -6.8709716796875, -6.55029296875, -6.2296142578125, -5.908935546875, -5.5882568359375, -5.267578125, -4.9468994140625, -4.626220703125, -4.3055419921875, -3.98486328125, -3.6641845703125, -3.343505859375, -3.0228271484375, -2.7021484375, -2.3814697265625, -2.060791015625, -1.7401123046875, -1.41943359375, -1.0987548828125, -0.778076171875, -0.4573974609375, -0.13671875, 0.1839599609375, 0.504638671875, 0.8253173828125, 1.14599609375, 1.4666748046875, 1.787353515625, 2.1080322265625, 2.4287109375, 2.7493896484375, 3.070068359375, 3.3907470703125, 3.71142578125, 4.0321044921875, 4.352783203125, 4.6734619140625, 4.994140625, 5.3148193359375, 5.635498046875, 5.9561767578125, 6.27685546875, 6.5975341796875, 6.918212890625, 7.2388916015625, 7.5595703125, 7.8802490234375, 8.200927734375, 8.5216064453125, 8.84228515625, 9.1629638671875, 9.483642578125, 9.8043212890625, 10.125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 9.0, 9.0, 12.0, 20.0, 36.0, 48.0, 78.0, 124.0, 198.0, 323.0, 547.0, 916.0, 1552.0, 2789.0, 5175.0, 10570.0, 21912.0, 46586.0, 94500.0, 165161.0, 218825.0, 202794.0, 135553.0, 72269.0, 34867.0, 16409.0, 7733.0, 4135.0, 2221.0, 1228.0, 801.0, 445.0, 252.0, 152.0, 112.0, 66.0, 40.0, 34.0, 18.0, 13.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8203125, -9.52978515625, -9.2392578125, -8.94873046875, -8.658203125, -8.36767578125, -8.0771484375, -7.78662109375, -7.49609375, -7.20556640625, -6.9150390625, -6.62451171875, -6.333984375, -6.04345703125, -5.7529296875, -5.46240234375, -5.171875, -4.88134765625, -4.5908203125, -4.30029296875, -4.009765625, -3.71923828125, -3.4287109375, -3.13818359375, -2.84765625, -2.55712890625, -2.2666015625, -1.97607421875, -1.685546875, -1.39501953125, -1.1044921875, -0.81396484375, -0.5234375, -0.23291015625, 0.0576171875, 0.34814453125, 0.638671875, 0.92919921875, 1.2197265625, 1.51025390625, 1.80078125, 2.09130859375, 2.3818359375, 2.67236328125, 2.962890625, 3.25341796875, 3.5439453125, 3.83447265625, 4.125, 4.41552734375, 4.7060546875, 4.99658203125, 5.287109375, 5.57763671875, 5.8681640625, 6.15869140625, 6.44921875, 6.73974609375, 7.0302734375, 7.32080078125, 7.611328125, 7.90185546875, 8.1923828125, 8.48291015625, 8.7734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 15.0, 12.0, 21.0, 30.0, 28.0, 58.0, 40.0, 53.0, 58.0, 79.0, 83.0, 93.0, 75.0, 69.0, 46.0, 48.0, 48.0, 28.0, 20.0, 26.0, 18.0, 12.0, 14.0, 4.0, 7.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011987686157226562, -0.0011665523052215576, -0.001134335994720459, -0.0011021196842193604, -0.0010699033737182617, -0.001037687063217163, -0.0010054707527160645, -0.0009732544422149658, -0.0009410381317138672, -0.0009088218212127686, -0.0008766055107116699, -0.0008443892002105713, -0.0008121728897094727, -0.000779956579208374, -0.0007477402687072754, -0.0007155239582061768, -0.0006833076477050781, -0.0006510913372039795, -0.0006188750267028809, -0.0005866587162017822, -0.0005544424057006836, -0.000522226095199585, -0.0004900097846984863, -0.0004577934741973877, -0.00042557716369628906, -0.00039336085319519043, -0.0003611445426940918, -0.00032892823219299316, -0.00029671192169189453, -0.0002644956111907959, -0.00023227930068969727, -0.00020006299018859863, -0.0001678466796875, -0.00013563036918640137, -0.00010341405868530273, -7.11977481842041e-05, -3.898143768310547e-05, -6.765127182006836e-06, 2.5451183319091797e-05, 5.766749382019043e-05, 8.988380432128906e-05, 0.0001221001148223877, 0.00015431642532348633, 0.00018653273582458496, 0.0002187490463256836, 0.0002509653568267822, 0.00028318166732788086, 0.0003153979778289795, 0.0003476142883300781, 0.00037983059883117676, 0.0004120469093322754, 0.000444263219833374, 0.00047647953033447266, 0.0005086958408355713, 0.0005409121513366699, 0.0005731284618377686, 0.0006053447723388672, 0.0006375610828399658, 0.0006697773933410645, 0.0007019937038421631, 0.0007342100143432617, 0.0007664263248443604, 0.000798642635345459, 0.0008308589458465576, 0.0008630752563476562]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 15.0, 11.0, 16.0, 30.0, 33.0, 52.0, 86.0, 119.0, 177.0, 232.0, 343.0, 513.0, 706.0, 1012.0, 1581.0, 2564.0, 4054.0, 6531.0, 10848.0, 18289.0, 32014.0, 55131.0, 90143.0, 133934.0, 166406.0, 166935.0, 132907.0, 90051.0, 55296.0, 31455.0, 18209.0, 10875.0, 6478.0, 3946.0, 2515.0, 1585.0, 1070.0, 742.0, 519.0, 360.0, 251.0, 163.0, 107.0, 86.0, 42.0, 53.0, 21.0, 16.0, 9.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-7.76953125, -7.5340576171875, -7.298583984375, -7.0631103515625, -6.82763671875, -6.5921630859375, -6.356689453125, -6.1212158203125, -5.8857421875, -5.6502685546875, -5.414794921875, -5.1793212890625, -4.94384765625, -4.7083740234375, -4.472900390625, -4.2374267578125, -4.001953125, -3.7664794921875, -3.531005859375, -3.2955322265625, -3.06005859375, -2.8245849609375, -2.589111328125, -2.3536376953125, -2.1181640625, -1.8826904296875, -1.647216796875, -1.4117431640625, -1.17626953125, -0.9407958984375, -0.705322265625, -0.4698486328125, -0.234375, 0.0010986328125, 0.236572265625, 0.4720458984375, 0.70751953125, 0.9429931640625, 1.178466796875, 1.4139404296875, 1.6494140625, 1.8848876953125, 2.120361328125, 2.3558349609375, 2.59130859375, 2.8267822265625, 3.062255859375, 3.2977294921875, 3.533203125, 3.7686767578125, 4.004150390625, 4.2396240234375, 4.47509765625, 4.7105712890625, 4.946044921875, 5.1815185546875, 5.4169921875, 5.6524658203125, 5.887939453125, 6.1234130859375, 6.35888671875, 6.5943603515625, 6.829833984375, 7.0653076171875, 7.30078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 6.0, 10.0, 12.0, 5.0, 10.0, 14.0, 12.0, 23.0, 23.0, 25.0, 48.0, 52.0, 54.0, 53.0, 49.0, 60.0, 48.0, 51.0, 64.0, 49.0, 53.0, 49.0, 38.0, 39.0, 26.0, 26.0, 21.0, 24.0, 10.0, 9.0, 10.0, 5.0, 7.0, 7.0, 1.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.435546875, -3.34283447265625, -3.2501220703125, -3.15740966796875, -3.064697265625, -2.97198486328125, -2.8792724609375, -2.78656005859375, -2.69384765625, -2.60113525390625, -2.5084228515625, -2.41571044921875, -2.322998046875, -2.23028564453125, -2.1375732421875, -2.04486083984375, -1.9521484375, -1.85943603515625, -1.7667236328125, -1.67401123046875, -1.581298828125, -1.48858642578125, -1.3958740234375, -1.30316162109375, -1.21044921875, -1.11773681640625, -1.0250244140625, -0.93231201171875, -0.839599609375, -0.74688720703125, -0.6541748046875, -0.56146240234375, -0.46875, -0.37603759765625, -0.2833251953125, -0.19061279296875, -0.097900390625, -0.00518798828125, 0.0875244140625, 0.18023681640625, 0.27294921875, 0.36566162109375, 0.4583740234375, 0.55108642578125, 0.643798828125, 0.73651123046875, 0.8292236328125, 0.92193603515625, 1.0146484375, 1.10736083984375, 1.2000732421875, 1.29278564453125, 1.385498046875, 1.47821044921875, 1.5709228515625, 1.66363525390625, 1.75634765625, 1.84906005859375, 1.9417724609375, 2.03448486328125, 2.127197265625, 2.21990966796875, 2.3126220703125, 2.40533447265625, 2.498046875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 11.0, 6.0, 12.0, 8.0, 16.0, 17.0, 11.0, 19.0, 23.0, 28.0, 32.0, 28.0, 44.0, 31.0, 35.0, 38.0, 45.0, 48.0, 34.0, 68.0, 49.0, 56.0, 40.0, 44.0, 25.0, 32.0, 26.0, 29.0, 18.0, 25.0, 16.0, 16.0, 10.0, 10.0, 9.0, 8.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0], "bins": [-19.33016014099121, -18.796630859375, -18.26310157775879, -17.729572296142578, -17.196041107177734, -16.662511825561523, -16.128982543945312, -15.595453262329102, -15.06192398071289, -14.52839469909668, -13.994865417480469, -13.461335182189941, -12.92780590057373, -12.39427661895752, -11.860746383666992, -11.327217102050781, -10.79368782043457, -10.26015853881836, -9.726629257202148, -9.193099021911621, -8.65956974029541, -8.1260404586792, -7.59251070022583, -7.058980941772461, -6.52545166015625, -5.991922378540039, -5.45839262008667, -4.924862861633301, -4.39133358001709, -3.8578040599823, -3.3242745399475098, -2.7907450199127197, -2.2572174072265625, -1.7236878871917725, -1.1901583671569824, -0.6566288471221924, -0.12309932708740234, 0.4104301929473877, 0.9439597129821777, 1.4774892330169678, 2.011018753051758, 2.544548273086548, 3.078077793121338, 3.611607313156128, 4.145136833190918, 4.678666114807129, 5.212195873260498, 5.745725631713867, 6.279254913330078, 6.812784194946289, 7.346313953399658, 7.879843711853027, 8.413372993469238, 8.94690227508545, 9.480432510375977, 10.013961791992188, 10.547491073608398, 11.08102035522461, 11.61454963684082, 12.148079872131348, 12.681609153747559, 13.21513843536377, 13.748668670654297, 14.282197952270508, 14.815727233886719]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 5.0, 5.0, 6.0, 8.0, 9.0, 10.0, 12.0, 20.0, 20.0, 22.0, 14.0, 27.0, 21.0, 29.0, 29.0, 28.0, 36.0, 34.0, 44.0, 39.0, 47.0, 33.0, 38.0, 35.0, 38.0, 30.0, 47.0, 35.0, 28.0, 40.0, 36.0, 38.0, 32.0, 12.0, 20.0, 12.0, 8.0, 12.0, 12.0, 7.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.04225730895996, -16.521116256713867, -15.999974250793457, -15.478833198547363, -14.95769214630127, -14.43655014038086, -13.915409088134766, -13.394268035888672, -12.873126983642578, -12.351985931396484, -11.830843925476074, -11.30970287322998, -10.788561820983887, -10.267419815063477, -9.746278762817383, -9.225137710571289, -8.703995704650879, -8.182854652404785, -7.661713123321533, -7.140571594238281, -6.6194305419921875, -6.0982890129089355, -5.577147483825684, -5.05600643157959, -4.534864902496338, -4.013723373413086, -3.492582321166992, -2.9714407920837402, -2.4502995014190674, -1.9291582107543945, -1.4080166816711426, -0.8868753910064697, -0.3657341003417969, 0.15540724992752075, 0.6765486001968384, 1.1976900100708008, 1.7188313007354736, 2.2399725914001465, 2.7611141204833984, 3.2822554111480713, 3.803396701812744, 4.324538230895996, 4.84567928314209, 5.366820812225342, 5.887962341308594, 6.4091033935546875, 6.9302449226379395, 7.451386451721191, 7.972527503967285, 8.493668556213379, 9.014810562133789, 9.535951614379883, 10.057092666625977, 10.57823371887207, 11.09937572479248, 11.620516777038574, 12.141658782958984, 12.662799835205078, 13.183941841125488, 13.705082893371582, 14.226223945617676, 14.747365951538086, 15.26850700378418, 15.789648056030273, 16.310789108276367]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 9.0, 13.0, 30.0, 35.0, 53.0, 83.0, 106.0, 182.0, 295.0, 439.0, 715.0, 1197.0, 1930.0, 3210.0, 5222.0, 8721.0, 14763.0, 25444.0, 44534.0, 77614.0, 134849.0, 232610.0, 375754.0, 543356.0, 664508.0, 657022.0, 525941.0, 357943.0, 219142.0, 127717.0, 72774.0, 41187.0, 23795.0, 13744.0, 7870.0, 4497.0, 2761.0, 1602.0, 1014.0, 620.0, 363.0, 220.0, 136.0, 100.0, 52.0, 38.0, 27.0, 12.0, 16.0, 9.0, 3.0, 2.0, 2.0, 5.0], "bins": [-18.53125, -18.0008544921875, -17.470458984375, -16.9400634765625, -16.40966796875, -15.8792724609375, -15.348876953125, -14.8184814453125, -14.2880859375, -13.7576904296875, -13.227294921875, -12.6968994140625, -12.16650390625, -11.6361083984375, -11.105712890625, -10.5753173828125, -10.044921875, -9.5145263671875, -8.984130859375, -8.4537353515625, -7.92333984375, -7.3929443359375, -6.862548828125, -6.3321533203125, -5.8017578125, -5.2713623046875, -4.740966796875, -4.2105712890625, -3.68017578125, -3.1497802734375, -2.619384765625, -2.0889892578125, -1.55859375, -1.0281982421875, -0.497802734375, 0.0325927734375, 0.56298828125, 1.0933837890625, 1.623779296875, 2.1541748046875, 2.6845703125, 3.2149658203125, 3.745361328125, 4.2757568359375, 4.80615234375, 5.3365478515625, 5.866943359375, 6.3973388671875, 6.927734375, 7.4581298828125, 7.988525390625, 8.5189208984375, 9.04931640625, 9.5797119140625, 10.110107421875, 10.6405029296875, 11.1708984375, 11.7012939453125, 12.231689453125, 12.7620849609375, 13.29248046875, 13.8228759765625, 14.353271484375, 14.8836669921875, 15.4140625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 2.0, 6.0, 5.0, 5.0, 11.0, 9.0, 5.0, 19.0, 18.0, 23.0, 14.0, 23.0, 25.0, 25.0, 25.0, 31.0, 34.0, 30.0, 37.0, 41.0, 45.0, 44.0, 29.0, 38.0, 38.0, 31.0, 38.0, 35.0, 39.0, 32.0, 42.0, 38.0, 33.0, 23.0, 18.0, 17.0, 13.0, 4.0, 13.0, 9.0, 8.0, 4.0, 3.0, 6.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.734375, -14.2796630859375, -13.824951171875, -13.3702392578125, -12.91552734375, -12.4608154296875, -12.006103515625, -11.5513916015625, -11.0966796875, -10.6419677734375, -10.187255859375, -9.7325439453125, -9.27783203125, -8.8231201171875, -8.368408203125, -7.9136962890625, -7.458984375, -7.0042724609375, -6.549560546875, -6.0948486328125, -5.64013671875, -5.1854248046875, -4.730712890625, -4.2760009765625, -3.8212890625, -3.3665771484375, -2.911865234375, -2.4571533203125, -2.00244140625, -1.5477294921875, -1.093017578125, -0.6383056640625, -0.18359375, 0.2711181640625, 0.725830078125, 1.1805419921875, 1.63525390625, 2.0899658203125, 2.544677734375, 2.9993896484375, 3.4541015625, 3.9088134765625, 4.363525390625, 4.8182373046875, 5.27294921875, 5.7276611328125, 6.182373046875, 6.6370849609375, 7.091796875, 7.5465087890625, 8.001220703125, 8.4559326171875, 8.91064453125, 9.3653564453125, 9.820068359375, 10.2747802734375, 10.7294921875, 11.1842041015625, 11.638916015625, 12.0936279296875, 12.54833984375, 13.0030517578125, 13.457763671875, 13.9124755859375, 14.3671875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 4.0, 6.0, 14.0, 15.0, 31.0, 42.0, 69.0, 111.0, 172.0, 291.0, 428.0, 676.0, 1131.0, 1708.0, 2850.0, 4401.0, 7189.0, 11674.0, 18923.0, 30652.0, 49281.0, 78871.0, 123327.0, 189698.0, 278984.0, 382191.0, 481555.0, 535924.0, 522133.0, 446247.0, 341766.0, 242477.0, 162541.0, 104933.0, 65959.0, 40962.0, 25330.0, 16035.0, 9682.0, 5894.0, 3712.0, 2364.0, 1478.0, 919.0, 621.0, 393.0, 226.0, 108.0, 116.0, 63.0, 39.0, 38.0, 17.0, 14.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.1171875, -14.6419677734375, -14.166748046875, -13.6915283203125, -13.21630859375, -12.7410888671875, -12.265869140625, -11.7906494140625, -11.3154296875, -10.8402099609375, -10.364990234375, -9.8897705078125, -9.41455078125, -8.9393310546875, -8.464111328125, -7.9888916015625, -7.513671875, -7.0384521484375, -6.563232421875, -6.0880126953125, -5.61279296875, -5.1375732421875, -4.662353515625, -4.1871337890625, -3.7119140625, -3.2366943359375, -2.761474609375, -2.2862548828125, -1.81103515625, -1.3358154296875, -0.860595703125, -0.3853759765625, 0.08984375, 0.5650634765625, 1.040283203125, 1.5155029296875, 1.99072265625, 2.4659423828125, 2.941162109375, 3.4163818359375, 3.8916015625, 4.3668212890625, 4.842041015625, 5.3172607421875, 5.79248046875, 6.2677001953125, 6.742919921875, 7.2181396484375, 7.693359375, 8.1685791015625, 8.643798828125, 9.1190185546875, 9.59423828125, 10.0694580078125, 10.544677734375, 11.0198974609375, 11.4951171875, 11.9703369140625, 12.445556640625, 12.9207763671875, 13.39599609375, 13.8712158203125, 14.346435546875, 14.8216552734375, 15.296875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 10.0, 12.0, 23.0, 27.0, 35.0, 44.0, 52.0, 73.0, 99.0, 96.0, 120.0, 172.0, 173.0, 197.0, 222.0, 240.0, 257.0, 235.0, 239.0, 242.0, 250.0, 215.0, 186.0, 169.0, 119.0, 104.0, 96.0, 88.0, 61.0, 54.0, 35.0, 28.0, 16.0, 18.0, 14.0, 14.0, 8.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41015625, -7.16107177734375, -6.9119873046875, -6.66290283203125, -6.413818359375, -6.16473388671875, -5.9156494140625, -5.66656494140625, -5.41748046875, -5.16839599609375, -4.9193115234375, -4.67022705078125, -4.421142578125, -4.17205810546875, -3.9229736328125, -3.67388916015625, -3.4248046875, -3.17572021484375, -2.9266357421875, -2.67755126953125, -2.428466796875, -2.17938232421875, -1.9302978515625, -1.68121337890625, -1.43212890625, -1.18304443359375, -0.9339599609375, -0.68487548828125, -0.435791015625, -0.18670654296875, 0.0623779296875, 0.31146240234375, 0.560546875, 0.80963134765625, 1.0587158203125, 1.30780029296875, 1.556884765625, 1.80596923828125, 2.0550537109375, 2.30413818359375, 2.55322265625, 2.80230712890625, 3.0513916015625, 3.30047607421875, 3.549560546875, 3.79864501953125, 4.0477294921875, 4.29681396484375, 4.5458984375, 4.79498291015625, 5.0440673828125, 5.29315185546875, 5.542236328125, 5.79132080078125, 6.0404052734375, 6.28948974609375, 6.53857421875, 6.78765869140625, 7.0367431640625, 7.28582763671875, 7.534912109375, 7.78399658203125, 8.0330810546875, 8.28216552734375, 8.53125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 4.0, 6.0, 4.0, 12.0, 10.0, 15.0, 15.0, 14.0, 27.0, 24.0, 34.0, 32.0, 41.0, 46.0, 64.0, 34.0, 51.0, 41.0, 56.0, 45.0, 54.0, 49.0, 49.0, 53.0, 34.0, 25.0, 31.0, 26.0, 19.0, 19.0, 17.0, 13.0, 9.0, 8.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.411867141723633, -16.836896896362305, -16.26192855834961, -15.686959266662598, -15.111989974975586, -14.537019729614258, -13.962050437927246, -13.387081146240234, -12.812111854553223, -12.237142562866211, -11.6621732711792, -11.087203979492188, -10.51223373413086, -9.937265396118164, -9.362295150756836, -8.787325859069824, -8.212356567382812, -7.637387275695801, -7.062417984008789, -6.487448215484619, -5.912478923797607, -5.337509632110596, -4.762539863586426, -4.187570571899414, -3.6126012802124023, -3.0376319885253906, -2.4626624584198, -1.8876930475234985, -1.3127236366271973, -0.7377543449401855, -0.16278481483459473, 0.4121847152709961, 0.9871559143066406, 1.562125325202942, 2.137094736099243, 2.712064266204834, 3.2870335578918457, 3.8620028495788574, 4.436972618103027, 5.011941909790039, 5.586911201477051, 6.1618804931640625, 6.736849784851074, 7.311819553375244, 7.886788845062256, 8.46175765991211, 9.036727905273438, 9.61169719696045, 10.186666488647461, 10.761635780334473, 11.336605072021484, 11.911574363708496, 12.486543655395508, 13.061513900756836, 13.636483192443848, 14.21145248413086, 14.786421775817871, 15.361391067504883, 15.936360359191895, 16.511329650878906, 17.086299896240234, 17.66126823425293, 18.236238479614258, 18.811206817626953, 19.38617706298828]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 7.0, 3.0, 5.0, 11.0, 9.0, 9.0, 13.0, 19.0, 25.0, 20.0, 21.0, 42.0, 24.0, 30.0, 38.0, 37.0, 46.0, 39.0, 39.0, 41.0, 40.0, 50.0, 37.0, 42.0, 38.0, 38.0, 36.0, 30.0, 27.0, 30.0, 24.0, 26.0, 21.0, 21.0, 12.0, 4.0, 8.0, 13.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-19.561710357666016, -19.025951385498047, -18.490190505981445, -17.954431533813477, -17.418670654296875, -16.882911682128906, -16.347150802612305, -15.811391830444336, -15.275630950927734, -14.73987102508545, -14.204111099243164, -13.668351173400879, -13.132591247558594, -12.596831321716309, -12.061071395874023, -11.525312423706055, -10.98955249786377, -10.453792572021484, -9.9180326461792, -9.382272720336914, -8.846512794494629, -8.310752868652344, -7.774993419647217, -7.239233493804932, -6.7034735679626465, -6.167713642120361, -5.631953716278076, -5.096194267272949, -4.560434341430664, -4.024674415588379, -3.4889144897460938, -2.9531545639038086, -2.417393684387207, -1.8816337585449219, -1.3458739519119263, -0.8101141452789307, -0.2743542194366455, 0.26140570640563965, 0.7971653938293457, 1.3329253196716309, 1.868685245513916, 2.404445171356201, 2.9402050971984863, 3.4759647846221924, 4.011724472045898, 4.547484397888184, 5.083244323730469, 5.619004249572754, 6.154764175415039, 6.690524101257324, 7.226284027099609, 7.7620439529418945, 8.29780387878418, 8.833563804626465, 9.36932373046875, 9.905082702636719, 10.44084358215332, 10.976603507995605, 11.51236343383789, 12.048123359680176, 12.583883285522461, 13.119643211364746, 13.655403137207031, 14.191162109375, 14.726922035217285]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 15.0, 15.0, 27.0, 44.0, 68.0, 119.0, 161.0, 302.0, 484.0, 837.0, 1351.0, 2189.0, 3743.0, 6019.0, 9935.0, 15733.0, 24415.0, 37926.0, 54863.0, 77045.0, 99707.0, 118235.0, 125733.0, 119720.0, 102111.0, 79606.0, 58080.0, 39507.0, 26296.0, 16785.0, 10649.0, 6494.0, 4087.0, 2495.0, 1546.0, 823.0, 553.0, 292.0, 213.0, 118.0, 75.0, 51.0, 33.0, 25.0, 14.0, 6.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.99951171875, -4.8505859375, -4.70166015625, -4.552734375, -4.40380859375, -4.2548828125, -4.10595703125, -3.95703125, -3.80810546875, -3.6591796875, -3.51025390625, -3.361328125, -3.21240234375, -3.0634765625, -2.91455078125, -2.765625, -2.61669921875, -2.4677734375, -2.31884765625, -2.169921875, -2.02099609375, -1.8720703125, -1.72314453125, -1.57421875, -1.42529296875, -1.2763671875, -1.12744140625, -0.978515625, -0.82958984375, -0.6806640625, -0.53173828125, -0.3828125, -0.23388671875, -0.0849609375, 0.06396484375, 0.212890625, 0.36181640625, 0.5107421875, 0.65966796875, 0.80859375, 0.95751953125, 1.1064453125, 1.25537109375, 1.404296875, 1.55322265625, 1.7021484375, 1.85107421875, 2.0, 2.14892578125, 2.2978515625, 2.44677734375, 2.595703125, 2.74462890625, 2.8935546875, 3.04248046875, 3.19140625, 3.34033203125, 3.4892578125, 3.63818359375, 3.787109375, 3.93603515625, 4.0849609375, 4.23388671875, 4.3828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 8.0, 3.0, 3.0, 12.0, 10.0, 9.0, 13.0, 19.0, 22.0, 22.0, 23.0, 39.0, 29.0, 26.0, 37.0, 36.0, 48.0, 38.0, 37.0, 44.0, 39.0, 51.0, 36.0, 40.0, 38.0, 42.0, 35.0, 28.0, 25.0, 32.0, 23.0, 25.0, 26.0, 19.0, 12.0, 4.0, 10.0, 13.0, 5.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-19.578125, -19.0416259765625, -18.505126953125, -17.9686279296875, -17.43212890625, -16.8956298828125, -16.359130859375, -15.8226318359375, -15.2861328125, -14.7496337890625, -14.213134765625, -13.6766357421875, -13.14013671875, -12.6036376953125, -12.067138671875, -11.5306396484375, -10.994140625, -10.4576416015625, -9.921142578125, -9.3846435546875, -8.84814453125, -8.3116455078125, -7.775146484375, -7.2386474609375, -6.7021484375, -6.1656494140625, -5.629150390625, -5.0926513671875, -4.55615234375, -4.0196533203125, -3.483154296875, -2.9466552734375, -2.41015625, -1.8736572265625, -1.337158203125, -0.8006591796875, -0.26416015625, 0.2723388671875, 0.808837890625, 1.3453369140625, 1.8818359375, 2.4183349609375, 2.954833984375, 3.4913330078125, 4.02783203125, 4.5643310546875, 5.100830078125, 5.6373291015625, 6.173828125, 6.7103271484375, 7.246826171875, 7.7833251953125, 8.31982421875, 8.8563232421875, 9.392822265625, 9.9293212890625, 10.4658203125, 11.0023193359375, 11.538818359375, 12.0753173828125, 12.61181640625, 13.1483154296875, 13.684814453125, 14.2213134765625, 14.7578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 9.0, 6.0, 17.0, 11.0, 14.0, 25.0, 43.0, 56.0, 95.0, 136.0, 210.0, 378.0, 522.0, 953.0, 1445.0, 2464.0, 4117.0, 6904.0, 11730.0, 21013.0, 41091.0, 820811.0, 76760.0, 25269.0, 14069.0, 8109.0, 4905.0, 2838.0, 1735.0, 1031.0, 603.0, 405.0, 247.0, 178.0, 96.0, 78.0, 49.0, 30.0, 25.0, 16.0, 13.0, 14.0, 9.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0], "bins": [-15.28125, -14.8133544921875, -14.345458984375, -13.8775634765625, -13.40966796875, -12.9417724609375, -12.473876953125, -12.0059814453125, -11.5380859375, -11.0701904296875, -10.602294921875, -10.1343994140625, -9.66650390625, -9.1986083984375, -8.730712890625, -8.2628173828125, -7.794921875, -7.3270263671875, -6.859130859375, -6.3912353515625, -5.92333984375, -5.4554443359375, -4.987548828125, -4.5196533203125, -4.0517578125, -3.5838623046875, -3.115966796875, -2.6480712890625, -2.18017578125, -1.7122802734375, -1.244384765625, -0.7764892578125, -0.30859375, 0.1593017578125, 0.627197265625, 1.0950927734375, 1.56298828125, 2.0308837890625, 2.498779296875, 2.9666748046875, 3.4345703125, 3.9024658203125, 4.370361328125, 4.8382568359375, 5.30615234375, 5.7740478515625, 6.241943359375, 6.7098388671875, 7.177734375, 7.6456298828125, 8.113525390625, 8.5814208984375, 9.04931640625, 9.5172119140625, 9.985107421875, 10.4530029296875, 10.9208984375, 11.3887939453125, 11.856689453125, 12.3245849609375, 12.79248046875, 13.2603759765625, 13.728271484375, 14.1961669921875, 14.6640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 6.0, 13.0, 8.0, 8.0, 13.0, 14.0, 17.0, 19.0, 25.0, 24.0, 34.0, 24.0, 39.0, 38.0, 38.0, 40.0, 42.0, 39.0, 40.0, 36.0, 37.0, 38.0, 27.0, 36.0, 30.0, 41.0, 31.0, 29.0, 30.0, 24.0, 19.0, 15.0, 18.0, 26.0, 10.0, 10.0, 12.0, 13.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8984375, -8.5606689453125, -8.222900390625, -7.8851318359375, -7.54736328125, -7.2095947265625, -6.871826171875, -6.5340576171875, -6.1962890625, -5.8585205078125, -5.520751953125, -5.1829833984375, -4.84521484375, -4.5074462890625, -4.169677734375, -3.8319091796875, -3.494140625, -3.1563720703125, -2.818603515625, -2.4808349609375, -2.14306640625, -1.8052978515625, -1.467529296875, -1.1297607421875, -0.7919921875, -0.4542236328125, -0.116455078125, 0.2213134765625, 0.55908203125, 0.8968505859375, 1.234619140625, 1.5723876953125, 1.91015625, 2.2479248046875, 2.585693359375, 2.9234619140625, 3.26123046875, 3.5989990234375, 3.936767578125, 4.2745361328125, 4.6123046875, 4.9500732421875, 5.287841796875, 5.6256103515625, 5.96337890625, 6.3011474609375, 6.638916015625, 6.9766845703125, 7.314453125, 7.6522216796875, 7.989990234375, 8.3277587890625, 8.66552734375, 9.0032958984375, 9.341064453125, 9.6788330078125, 10.0166015625, 10.3543701171875, 10.692138671875, 11.0299072265625, 11.36767578125, 11.7054443359375, 12.043212890625, 12.3809814453125, 12.71875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 13.0, 14.0, 26.0, 20.0, 39.0, 63.0, 96.0, 120.0, 186.0, 272.0, 406.0, 612.0, 962.0, 1635.0, 2519.0, 4280.0, 7135.0, 12626.0, 23838.0, 71413.0, 824973.0, 48374.0, 21006.0, 11217.0, 6509.0, 3817.0, 2310.0, 1445.0, 866.0, 598.0, 357.0, 274.0, 146.0, 95.0, 97.0, 47.0, 47.0, 14.0, 18.0, 18.0, 11.0, 8.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81640625, -0.7886428833007812, -0.7608795166015625, -0.7331161499023438, -0.705352783203125, -0.6775894165039062, -0.6498260498046875, -0.6220626831054688, -0.59429931640625, -0.5665359497070312, -0.5387725830078125, -0.5110092163085938, -0.483245849609375, -0.45548248291015625, -0.4277191162109375, -0.39995574951171875, -0.3721923828125, -0.34442901611328125, -0.3166656494140625, -0.28890228271484375, -0.261138916015625, -0.23337554931640625, -0.2056121826171875, -0.17784881591796875, -0.15008544921875, -0.12232208251953125, -0.0945587158203125, -0.06679534912109375, -0.039031982421875, -0.01126861572265625, 0.0164947509765625, 0.04425811767578125, 0.072021484375, 0.09978485107421875, 0.1275482177734375, 0.15531158447265625, 0.183074951171875, 0.21083831787109375, 0.2386016845703125, 0.26636505126953125, 0.29412841796875, 0.32189178466796875, 0.3496551513671875, 0.37741851806640625, 0.405181884765625, 0.43294525146484375, 0.4607086181640625, 0.48847198486328125, 0.5162353515625, 0.5439987182617188, 0.5717620849609375, 0.5995254516601562, 0.627288818359375, 0.6550521850585938, 0.6828155517578125, 0.7105789184570312, 0.73834228515625, 0.7661056518554688, 0.7938690185546875, 0.8216323852539062, 0.849395751953125, 0.8771591186523438, 0.9049224853515625, 0.9326858520507812, 0.96044921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 11.0, 7.0, 11.0, 12.0, 11.0, 17.0, 13.0, 23.0, 29.0, 39.0, 40.0, 38.0, 54.0, 57.0, 65.0, 67.0, 62.0, 64.0, 50.0, 48.0, 44.0, 45.0, 27.0, 35.0, 15.0, 24.0, 16.0, 12.0, 15.0, 7.0, 4.0, 10.0, 5.0, 1.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-8.499622344970703e-05, -8.279364556074142e-05, -8.059106767177582e-05, -7.838848978281021e-05, -7.61859118938446e-05, -7.3983334004879e-05, -7.178075611591339e-05, -6.957817822694778e-05, -6.737560033798218e-05, -6.517302244901657e-05, -6.297044456005096e-05, -6.076786667108536e-05, -5.856528878211975e-05, -5.6362710893154144e-05, -5.416013300418854e-05, -5.195755511522293e-05, -4.9754977226257324e-05, -4.755239933729172e-05, -4.534982144832611e-05, -4.3147243559360504e-05, -4.09446656703949e-05, -3.874208778142929e-05, -3.6539509892463684e-05, -3.433693200349808e-05, -3.213435411453247e-05, -2.9931776225566864e-05, -2.7729198336601257e-05, -2.552662044763565e-05, -2.3324042558670044e-05, -2.1121464669704437e-05, -1.891888678073883e-05, -1.6716308891773224e-05, -1.4513731002807617e-05, -1.231115311384201e-05, -1.0108575224876404e-05, -7.905997335910797e-06, -5.7034194469451904e-06, -3.5008415579795837e-06, -1.298263669013977e-06, 9.043142199516296e-07, 3.1068921089172363e-06, 5.309469997882843e-06, 7.51204788684845e-06, 9.714625775814056e-06, 1.1917203664779663e-05, 1.411978155374527e-05, 1.6322359442710876e-05, 1.8524937331676483e-05, 2.072751522064209e-05, 2.2930093109607697e-05, 2.5132670998573303e-05, 2.733524888753891e-05, 2.9537826776504517e-05, 3.174040466547012e-05, 3.394298255443573e-05, 3.614556044340134e-05, 3.834813833236694e-05, 4.055071622133255e-05, 4.275329411029816e-05, 4.4955871999263763e-05, 4.715844988822937e-05, 4.936102777719498e-05, 5.1563605666160583e-05, 5.376618355512619e-05, 5.59687614440918e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 14.0, 11.0, 17.0, 39.0, 61.0, 105.0, 141.0, 249.0, 367.0, 631.0, 1077.0, 1657.0, 2765.0, 4339.0, 6979.0, 11102.0, 17576.0, 26967.0, 40755.0, 59006.0, 81850.0, 104069.0, 121312.0, 125876.0, 116213.0, 97663.0, 74391.0, 52850.0, 36010.0, 23583.0, 15170.0, 9781.0, 6060.0, 3777.0, 2377.0, 1412.0, 850.0, 540.0, 331.0, 205.0, 133.0, 79.0, 60.0, 30.0, 31.0, 16.0, 14.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67626953125, -0.654693603515625, -0.63311767578125, -0.611541748046875, -0.5899658203125, -0.568389892578125, -0.54681396484375, -0.525238037109375, -0.503662109375, -0.482086181640625, -0.46051025390625, -0.438934326171875, -0.4173583984375, -0.395782470703125, -0.37420654296875, -0.352630615234375, -0.3310546875, -0.309478759765625, -0.28790283203125, -0.266326904296875, -0.2447509765625, -0.223175048828125, -0.20159912109375, -0.180023193359375, -0.158447265625, -0.136871337890625, -0.11529541015625, -0.093719482421875, -0.0721435546875, -0.050567626953125, -0.02899169921875, -0.007415771484375, 0.01416015625, 0.035736083984375, 0.05731201171875, 0.078887939453125, 0.1004638671875, 0.122039794921875, 0.14361572265625, 0.165191650390625, 0.186767578125, 0.208343505859375, 0.22991943359375, 0.251495361328125, 0.2730712890625, 0.294647216796875, 0.31622314453125, 0.337799072265625, 0.359375, 0.380950927734375, 0.40252685546875, 0.424102783203125, 0.4456787109375, 0.467254638671875, 0.48883056640625, 0.510406494140625, 0.531982421875, 0.553558349609375, 0.57513427734375, 0.596710205078125, 0.6182861328125, 0.639862060546875, 0.66143798828125, 0.683013916015625, 0.70458984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 6.0, 9.0, 11.0, 13.0, 13.0, 15.0, 18.0, 24.0, 32.0, 28.0, 26.0, 33.0, 40.0, 38.0, 46.0, 42.0, 43.0, 51.0, 38.0, 45.0, 44.0, 39.0, 37.0, 36.0, 36.0, 38.0, 34.0, 25.0, 17.0, 12.0, 17.0, 16.0, 16.0, 7.0, 12.0, 6.0, 5.0, 8.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.268310546875, -0.2587890625, -0.249267578125, -0.23974609375, -0.230224609375, -0.220703125, -0.211181640625, -0.20166015625, -0.192138671875, -0.1826171875, -0.173095703125, -0.16357421875, -0.154052734375, -0.14453125, -0.135009765625, -0.12548828125, -0.115966796875, -0.1064453125, -0.096923828125, -0.08740234375, -0.077880859375, -0.068359375, -0.058837890625, -0.04931640625, -0.039794921875, -0.0302734375, -0.020751953125, -0.01123046875, -0.001708984375, 0.0078125, 0.017333984375, 0.02685546875, 0.036376953125, 0.0458984375, 0.055419921875, 0.06494140625, 0.074462890625, 0.083984375, 0.093505859375, 0.10302734375, 0.112548828125, 0.1220703125, 0.131591796875, 0.14111328125, 0.150634765625, 0.16015625, 0.169677734375, 0.17919921875, 0.188720703125, 0.1982421875, 0.207763671875, 0.21728515625, 0.226806640625, 0.236328125, 0.245849609375, 0.25537109375, 0.264892578125, 0.2744140625, 0.283935546875, 0.29345703125, 0.302978515625, 0.3125, 0.322021484375, 0.33154296875, 0.341064453125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 4.0, 15.0, 8.0, 12.0, 11.0, 16.0, 22.0, 24.0, 31.0, 38.0, 35.0, 45.0, 56.0, 42.0, 47.0, 42.0, 47.0, 56.0, 43.0, 60.0, 43.0, 49.0, 38.0, 28.0, 36.0, 35.0, 15.0, 17.0, 21.0, 12.0, 6.0, 14.0, 10.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.721406936645508, -17.143901824951172, -16.566396713256836, -15.9888916015625, -15.411385536193848, -14.833880424499512, -14.256375312805176, -13.678869247436523, -13.101364135742188, -12.523859024047852, -11.946353912353516, -11.36884880065918, -10.791342735290527, -10.213837623596191, -9.636332511901855, -9.058826446533203, -8.481322288513184, -7.903817176818848, -7.3263115882873535, -6.748806476593018, -6.171300888061523, -5.5937957763671875, -5.016290664672852, -4.438785076141357, -3.8612799644470215, -3.2837746143341064, -2.7062692642211914, -2.1287641525268555, -1.5512588024139404, -0.9737534523010254, -0.39624834060668945, 0.1812572479248047, 0.7587623596191406, 1.3362677097320557, 1.9137729406356812, 2.4912781715393066, 3.0687835216522217, 3.6462888717651367, 4.223793983459473, 4.801299571990967, 5.378804683685303, 5.956309795379639, 6.533815383911133, 7.111320495605469, 7.688825607299805, 8.26633071899414, 8.843835830688477, 9.421341896057129, 9.998847007751465, 10.5763521194458, 11.153857231140137, 11.731363296508789, 12.308868408203125, 12.886373519897461, 13.463878631591797, 14.041383743286133, 14.618888854980469, 15.196393966674805, 15.77389907836914, 16.351404190063477, 16.928909301757812, 17.50641632080078, 18.083919525146484, 18.661426544189453, 19.23893165588379]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 8.0, 3.0, 2.0, 12.0, 9.0, 11.0, 14.0, 15.0, 24.0, 20.0, 24.0, 41.0, 27.0, 27.0, 40.0, 31.0, 51.0, 33.0, 47.0, 40.0, 35.0, 54.0, 35.0, 41.0, 40.0, 39.0, 37.0, 26.0, 32.0, 29.0, 23.0, 23.0, 25.0, 23.0, 8.0, 7.0, 10.0, 11.0, 4.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-19.69591522216797, -19.156055450439453, -18.616195678710938, -18.076337814331055, -17.53647804260254, -16.996618270874023, -16.456758499145508, -15.916899681091309, -15.37704086303711, -14.837181091308594, -14.297322273254395, -13.757462501525879, -13.21760368347168, -12.677743911743164, -12.137884140014648, -11.59802532196045, -11.058165550231934, -10.518305778503418, -9.978446960449219, -9.438587188720703, -8.898728370666504, -8.358868598937988, -7.819009304046631, -7.279150009155273, -6.739290714263916, -6.199431419372559, -5.659572124481201, -5.119712829589844, -4.579853057861328, -4.039994239807129, -3.5001344680786133, -2.960275173187256, -2.420414924621582, -1.8805556297302246, -1.3406962156295776, -0.8008368015289307, -0.26097750663757324, 0.2788817882537842, 0.8187413215637207, 1.3586006164550781, 1.8984599113464355, 2.438319206237793, 2.9781785011291504, 3.518038034439087, 4.057897567749023, 4.597756385803223, 5.137616157531738, 5.677475452423096, 6.217334747314453, 6.7571940422058105, 7.297053337097168, 7.836913108825684, 8.376771926879883, 8.916631698608398, 9.456491470336914, 9.996350288391113, 10.536209106445312, 11.076068878173828, 11.615927696228027, 12.155787467956543, 12.695646286010742, 13.235506057739258, 13.775365829467773, 14.315224647521973, 14.855084419250488]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 7.0, 14.0, 17.0, 36.0, 49.0, 71.0, 129.0, 191.0, 318.0, 483.0, 798.0, 1300.0, 2081.0, 3383.0, 5592.0, 8917.0, 14152.0, 21537.0, 32795.0, 46858.0, 64420.0, 82127.0, 98116.0, 110115.0, 112663.0, 105678.0, 91251.0, 74179.0, 55739.0, 39763.0, 27490.0, 17785.0, 11403.0, 7318.0, 4584.0, 2758.0, 1670.0, 1030.0, 693.0, 383.0, 250.0, 151.0, 104.0, 56.0, 41.0, 24.0, 17.0, 10.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.203125, -11.771484375, -11.33984375, -10.908203125, -10.4765625, -10.044921875, -9.61328125, -9.181640625, -8.75, -8.318359375, -7.88671875, -7.455078125, -7.0234375, -6.591796875, -6.16015625, -5.728515625, -5.296875, -4.865234375, -4.43359375, -4.001953125, -3.5703125, -3.138671875, -2.70703125, -2.275390625, -1.84375, -1.412109375, -0.98046875, -0.548828125, -0.1171875, 0.314453125, 0.74609375, 1.177734375, 1.609375, 2.041015625, 2.47265625, 2.904296875, 3.3359375, 3.767578125, 4.19921875, 4.630859375, 5.0625, 5.494140625, 5.92578125, 6.357421875, 6.7890625, 7.220703125, 7.65234375, 8.083984375, 8.515625, 8.947265625, 9.37890625, 9.810546875, 10.2421875, 10.673828125, 11.10546875, 11.537109375, 11.96875, 12.400390625, 12.83203125, 13.263671875, 13.6953125, 14.126953125, 14.55859375, 14.990234375, 15.421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 4.0, 2.0, 9.0, 11.0, 10.0, 13.0, 21.0, 19.0, 19.0, 22.0, 39.0, 30.0, 28.0, 37.0, 30.0, 52.0, 33.0, 46.0, 38.0, 39.0, 54.0, 33.0, 41.0, 39.0, 46.0, 34.0, 24.0, 32.0, 30.0, 17.0, 27.0, 27.0, 20.0, 15.0, 6.0, 10.0, 11.0, 6.0, 6.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 3.0], "bins": [-18.9375, -18.4207763671875, -17.904052734375, -17.3873291015625, -16.87060546875, -16.3538818359375, -15.837158203125, -15.3204345703125, -14.8037109375, -14.2869873046875, -13.770263671875, -13.2535400390625, -12.73681640625, -12.2200927734375, -11.703369140625, -11.1866455078125, -10.669921875, -10.1531982421875, -9.636474609375, -9.1197509765625, -8.60302734375, -8.0863037109375, -7.569580078125, -7.0528564453125, -6.5361328125, -6.0194091796875, -5.502685546875, -4.9859619140625, -4.46923828125, -3.9525146484375, -3.435791015625, -2.9190673828125, -2.40234375, -1.8856201171875, -1.368896484375, -0.8521728515625, -0.33544921875, 0.1812744140625, 0.697998046875, 1.2147216796875, 1.7314453125, 2.2481689453125, 2.764892578125, 3.2816162109375, 3.79833984375, 4.3150634765625, 4.831787109375, 5.3485107421875, 5.865234375, 6.3819580078125, 6.898681640625, 7.4154052734375, 7.93212890625, 8.4488525390625, 8.965576171875, 9.4822998046875, 9.9990234375, 10.5157470703125, 11.032470703125, 11.5491943359375, 12.06591796875, 12.5826416015625, 13.099365234375, 13.6160888671875, 14.1328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 11.0, 11.0, 11.0, 24.0, 41.0, 53.0, 80.0, 111.0, 209.0, 282.0, 464.0, 644.0, 1004.0, 1543.0, 2326.0, 3631.0, 5648.0, 8757.0, 13000.0, 19431.0, 28152.0, 40362.0, 54974.0, 71174.0, 87294.0, 99099.0, 105986.0, 104947.0, 95828.0, 81546.0, 64752.0, 48890.0, 35190.0, 24564.0, 16411.0, 11035.0, 7294.0, 4838.0, 3084.0, 1968.0, 1298.0, 917.0, 585.0, 383.0, 227.0, 162.0, 103.0, 83.0, 52.0, 32.0, 20.0, 8.0, 9.0, 3.0, 6.0, 2.0, 4.0], "bins": [-13.1640625, -12.774658203125, -12.38525390625, -11.995849609375, -11.6064453125, -11.217041015625, -10.82763671875, -10.438232421875, -10.048828125, -9.659423828125, -9.27001953125, -8.880615234375, -8.4912109375, -8.101806640625, -7.71240234375, -7.322998046875, -6.93359375, -6.544189453125, -6.15478515625, -5.765380859375, -5.3759765625, -4.986572265625, -4.59716796875, -4.207763671875, -3.818359375, -3.428955078125, -3.03955078125, -2.650146484375, -2.2607421875, -1.871337890625, -1.48193359375, -1.092529296875, -0.703125, -0.313720703125, 0.07568359375, 0.465087890625, 0.8544921875, 1.243896484375, 1.63330078125, 2.022705078125, 2.412109375, 2.801513671875, 3.19091796875, 3.580322265625, 3.9697265625, 4.359130859375, 4.74853515625, 5.137939453125, 5.52734375, 5.916748046875, 6.30615234375, 6.695556640625, 7.0849609375, 7.474365234375, 7.86376953125, 8.253173828125, 8.642578125, 9.031982421875, 9.42138671875, 9.810791015625, 10.2001953125, 10.589599609375, 10.97900390625, 11.368408203125, 11.7578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 8.0, 3.0, 3.0, 8.0, 14.0, 14.0, 18.0, 21.0, 29.0, 30.0, 36.0, 37.0, 38.0, 38.0, 38.0, 52.0, 51.0, 46.0, 45.0, 46.0, 34.0, 39.0, 54.0, 41.0, 42.0, 43.0, 21.0, 25.0, 23.0, 23.0, 17.0, 9.0, 10.0, 11.0, 6.0, 10.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-13.5859375, -13.213623046875, -12.84130859375, -12.468994140625, -12.0966796875, -11.724365234375, -11.35205078125, -10.979736328125, -10.607421875, -10.235107421875, -9.86279296875, -9.490478515625, -9.1181640625, -8.745849609375, -8.37353515625, -8.001220703125, -7.62890625, -7.256591796875, -6.88427734375, -6.511962890625, -6.1396484375, -5.767333984375, -5.39501953125, -5.022705078125, -4.650390625, -4.278076171875, -3.90576171875, -3.533447265625, -3.1611328125, -2.788818359375, -2.41650390625, -2.044189453125, -1.671875, -1.299560546875, -0.92724609375, -0.554931640625, -0.1826171875, 0.189697265625, 0.56201171875, 0.934326171875, 1.306640625, 1.678955078125, 2.05126953125, 2.423583984375, 2.7958984375, 3.168212890625, 3.54052734375, 3.912841796875, 4.28515625, 4.657470703125, 5.02978515625, 5.402099609375, 5.7744140625, 6.146728515625, 6.51904296875, 6.891357421875, 7.263671875, 7.635986328125, 8.00830078125, 8.380615234375, 8.7529296875, 9.125244140625, 9.49755859375, 9.869873046875, 10.2421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 3.0, 9.0, 11.0, 18.0, 27.0, 52.0, 66.0, 113.0, 173.0, 258.0, 441.0, 858.0, 1480.0, 2636.0, 5189.0, 10235.0, 20605.0, 40899.0, 76879.0, 131091.0, 181637.0, 195770.0, 159186.0, 103548.0, 57493.0, 29232.0, 14850.0, 7361.0, 3861.0, 1955.0, 1061.0, 577.0, 355.0, 218.0, 132.0, 103.0, 69.0, 35.0, 18.0, 17.0, 8.0, 12.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.9453125, -8.6842041015625, -8.423095703125, -8.1619873046875, -7.90087890625, -7.6397705078125, -7.378662109375, -7.1175537109375, -6.8564453125, -6.5953369140625, -6.334228515625, -6.0731201171875, -5.81201171875, -5.5509033203125, -5.289794921875, -5.0286865234375, -4.767578125, -4.5064697265625, -4.245361328125, -3.9842529296875, -3.72314453125, -3.4620361328125, -3.200927734375, -2.9398193359375, -2.6787109375, -2.4176025390625, -2.156494140625, -1.8953857421875, -1.63427734375, -1.3731689453125, -1.112060546875, -0.8509521484375, -0.58984375, -0.3287353515625, -0.067626953125, 0.1934814453125, 0.45458984375, 0.7156982421875, 0.976806640625, 1.2379150390625, 1.4990234375, 1.7601318359375, 2.021240234375, 2.2823486328125, 2.54345703125, 2.8045654296875, 3.065673828125, 3.3267822265625, 3.587890625, 3.8489990234375, 4.110107421875, 4.3712158203125, 4.63232421875, 4.8934326171875, 5.154541015625, 5.4156494140625, 5.6767578125, 5.9378662109375, 6.198974609375, 6.4600830078125, 6.72119140625, 6.9822998046875, 7.243408203125, 7.5045166015625, 7.765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 6.0, 12.0, 9.0, 19.0, 9.0, 23.0, 18.0, 29.0, 21.0, 26.0, 37.0, 35.0, 41.0, 35.0, 53.0, 43.0, 52.0, 59.0, 56.0, 33.0, 43.0, 49.0, 42.0, 40.0, 29.0, 31.0, 24.0, 17.0, 17.0, 17.0, 15.0, 8.0, 8.0, 7.0, 7.0, 6.0, 2.0, 6.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005855560302734375, -0.0005657151341438293, -0.0005458742380142212, -0.000526033341884613, -0.0005061924457550049, -0.00048635154962539673, -0.0004665106534957886, -0.0004466697573661804, -0.00042682886123657227, -0.0004069879651069641, -0.00038714706897735596, -0.0003673061728477478, -0.00034746527671813965, -0.0003276243805885315, -0.00030778348445892334, -0.0002879425883293152, -0.00026810169219970703, -0.0002482607960700989, -0.00022841989994049072, -0.00020857900381088257, -0.00018873810768127441, -0.00016889721155166626, -0.0001490563154220581, -0.00012921541929244995, -0.0001093745231628418, -8.953362703323364e-05, -6.969273090362549e-05, -4.9851834774017334e-05, -3.001093864440918e-05, -1.0170042514801025e-05, 9.670853614807129e-06, 2.9511749744415283e-05, 4.935264587402344e-05, 6.919354200363159e-05, 8.903443813323975e-05, 0.0001088753342628479, 0.00012871623039245605, 0.0001485571265220642, 0.00016839802265167236, 0.00018823891878128052, 0.00020807981491088867, 0.00022792071104049683, 0.000247761607170105, 0.00026760250329971313, 0.0002874433994293213, 0.00030728429555892944, 0.0003271251916885376, 0.00034696608781814575, 0.0003668069839477539, 0.00038664788007736206, 0.0004064887762069702, 0.00042632967233657837, 0.0004461705684661865, 0.0004660114645957947, 0.00048585236072540283, 0.000505693256855011, 0.0005255341529846191, 0.0005453750491142273, 0.0005652159452438354, 0.0005850568413734436, 0.0006048977375030518, 0.0006247386336326599, 0.0006445795297622681, 0.0006644204258918762, 0.0006842613220214844]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 12.0, 25.0, 29.0, 66.0, 86.0, 129.0, 196.0, 270.0, 440.0, 719.0, 1089.0, 1743.0, 2838.0, 5035.0, 8844.0, 15357.0, 28082.0, 49293.0, 82607.0, 126366.0, 164051.0, 171663.0, 144224.0, 100673.0, 61705.0, 35881.0, 19986.0, 11242.0, 6442.0, 3640.0, 2119.0, 1292.0, 858.0, 496.0, 344.0, 228.0, 181.0, 103.0, 72.0, 41.0, 33.0, 22.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.05914306640625, -6.8175048828125, -6.57586669921875, -6.334228515625, -6.09259033203125, -5.8509521484375, -5.60931396484375, -5.36767578125, -5.12603759765625, -4.8843994140625, -4.64276123046875, -4.401123046875, -4.15948486328125, -3.9178466796875, -3.67620849609375, -3.4345703125, -3.19293212890625, -2.9512939453125, -2.70965576171875, -2.468017578125, -2.22637939453125, -1.9847412109375, -1.74310302734375, -1.50146484375, -1.25982666015625, -1.0181884765625, -0.77655029296875, -0.534912109375, -0.29327392578125, -0.0516357421875, 0.19000244140625, 0.431640625, 0.67327880859375, 0.9149169921875, 1.15655517578125, 1.398193359375, 1.63983154296875, 1.8814697265625, 2.12310791015625, 2.36474609375, 2.60638427734375, 2.8480224609375, 3.08966064453125, 3.331298828125, 3.57293701171875, 3.8145751953125, 4.05621337890625, 4.2978515625, 4.53948974609375, 4.7811279296875, 5.02276611328125, 5.264404296875, 5.50604248046875, 5.7476806640625, 5.98931884765625, 6.23095703125, 6.47259521484375, 6.7142333984375, 6.95587158203125, 7.197509765625, 7.43914794921875, 7.6807861328125, 7.92242431640625, 8.1640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 6.0, 8.0, 14.0, 25.0, 15.0, 25.0, 39.0, 50.0, 53.0, 54.0, 51.0, 58.0, 64.0, 52.0, 43.0, 51.0, 42.0, 60.0, 50.0, 34.0, 36.0, 46.0, 24.0, 11.0, 14.0, 11.0, 11.0, 6.0, 8.0, 9.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.224609375, -3.134552001953125, -3.04449462890625, -2.954437255859375, -2.8643798828125, -2.774322509765625, -2.68426513671875, -2.594207763671875, -2.504150390625, -2.414093017578125, -2.32403564453125, -2.233978271484375, -2.1439208984375, -2.053863525390625, -1.96380615234375, -1.873748779296875, -1.78369140625, -1.693634033203125, -1.60357666015625, -1.513519287109375, -1.4234619140625, -1.333404541015625, -1.24334716796875, -1.153289794921875, -1.063232421875, -0.973175048828125, -0.88311767578125, -0.793060302734375, -0.7030029296875, -0.612945556640625, -0.52288818359375, -0.432830810546875, -0.3427734375, -0.252716064453125, -0.16265869140625, -0.072601318359375, 0.0174560546875, 0.107513427734375, 0.19757080078125, 0.287628173828125, 0.377685546875, 0.467742919921875, 0.55780029296875, 0.647857666015625, 0.7379150390625, 0.827972412109375, 0.91802978515625, 1.008087158203125, 1.09814453125, 1.188201904296875, 1.27825927734375, 1.368316650390625, 1.4583740234375, 1.548431396484375, 1.63848876953125, 1.728546142578125, 1.818603515625, 1.908660888671875, 1.99871826171875, 2.088775634765625, 2.1788330078125, 2.268890380859375, 2.35894775390625, 2.449005126953125, 2.5390625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 0.0, 10.0, 4.0, 14.0, 4.0, 21.0, 25.0, 17.0, 17.0, 29.0, 29.0, 35.0, 41.0, 37.0, 43.0, 45.0, 41.0, 52.0, 38.0, 44.0, 53.0, 45.0, 37.0, 49.0, 36.0, 26.0, 37.0, 29.0, 19.0, 14.0, 11.0, 20.0, 18.0, 9.0, 8.0, 13.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.019598007202148, -14.498157501220703, -13.976716995239258, -13.455277442932129, -12.933836936950684, -12.412396430969238, -11.89095687866211, -11.369516372680664, -10.848075866699219, -10.326635360717773, -9.805194854736328, -9.2837553024292, -8.762314796447754, -8.240874290466309, -7.7194342613220215, -7.197994232177734, -6.676553726196289, -6.155113220214844, -5.633673191070557, -5.1122331619262695, -4.590792655944824, -4.069352149963379, -3.547912120819092, -3.0264718532562256, -2.5050315856933594, -1.9835913181304932, -1.462151050567627, -0.9407107830047607, -0.41927051544189453, 0.10216975212097168, 0.6236100196838379, 1.145050287246704, 1.6664905548095703, 2.1879308223724365, 2.7093710899353027, 3.230811357498169, 3.752251625061035, 4.2736921310424805, 4.795132160186768, 5.316572189331055, 5.8380126953125, 6.359453201293945, 6.880893230438232, 7.4023332595825195, 7.923773765563965, 8.44521427154541, 8.966653823852539, 9.488094329833984, 10.00953483581543, 10.530975341796875, 11.05241584777832, 11.57385540008545, 12.095295906066895, 12.61673641204834, 13.138175964355469, 13.659616470336914, 14.18105697631836, 14.702497482299805, 15.22393798828125, 15.745377540588379, 16.26681900024414, 16.788257598876953, 17.3096981048584, 17.831138610839844, 18.35257911682129]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 6.0, 8.0, 4.0, 7.0, 10.0, 15.0, 13.0, 20.0, 16.0, 21.0, 21.0, 28.0, 32.0, 26.0, 37.0, 42.0, 38.0, 29.0, 29.0, 40.0, 43.0, 27.0, 40.0, 32.0, 51.0, 30.0, 34.0, 34.0, 19.0, 25.0, 34.0, 21.0, 19.0, 20.0, 17.0, 23.0, 13.0, 10.0, 10.0, 11.0, 6.0, 6.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.489995956420898, -14.008938789367676, -13.527880668640137, -13.046823501586914, -12.565766334533691, -12.084709167480469, -11.60365104675293, -11.122593879699707, -10.641536712646484, -10.160479545593262, -9.679421424865723, -9.1983642578125, -8.717307090759277, -8.236249923706055, -7.755191802978516, -7.274134635925293, -6.793076515197754, -6.312018871307373, -5.83096170425415, -5.3499040603637695, -4.868846893310547, -4.387789249420166, -3.906731605529785, -3.4256742000579834, -2.9446167945861816, -2.46355938911438, -1.9825018644332886, -1.5014443397521973, -1.0203869342803955, -0.5393295288085938, -0.05827188491821289, 0.42278552055358887, 0.9038429260253906, 1.3849003314971924, 1.8659578561782837, 2.347015380859375, 2.8280727863311768, 3.3091301918029785, 3.7901878356933594, 4.271245002746582, 4.752302646636963, 5.233360290527344, 5.714417457580566, 6.195475101470947, 6.676532745361328, 7.157589912414551, 7.638647556304932, 8.119705200195312, 8.600762367248535, 9.081819534301758, 9.562877655029297, 10.04393482208252, 10.524991989135742, 11.006050109863281, 11.487107276916504, 11.968164443969727, 12.449222564697266, 12.930279731750488, 13.411337852478027, 13.89239501953125, 14.373452186584473, 14.854509353637695, 15.335567474365234, 15.816624641418457, 16.29768180847168]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 17.0, 32.0, 29.0, 52.0, 81.0, 134.0, 198.0, 280.0, 448.0, 680.0, 1012.0, 1685.0, 2677.0, 4401.0, 7209.0, 11761.0, 19451.0, 33003.0, 56196.0, 96301.0, 161772.0, 263419.0, 397278.0, 535010.0, 618217.0, 597751.0, 487061.0, 345780.0, 222250.0, 134153.0, 79799.0, 47082.0, 27954.0, 16128.0, 9781.0, 5703.0, 3601.0, 2175.0, 1328.0, 925.0, 536.0, 328.0, 242.0, 116.0, 91.0, 52.0, 25.0, 23.0, 17.0, 11.0, 9.0, 0.0, 5.0, 3.0], "bins": [-17.375, -16.8759765625, -16.376953125, -15.8779296875, -15.37890625, -14.8798828125, -14.380859375, -13.8818359375, -13.3828125, -12.8837890625, -12.384765625, -11.8857421875, -11.38671875, -10.8876953125, -10.388671875, -9.8896484375, -9.390625, -8.8916015625, -8.392578125, -7.8935546875, -7.39453125, -6.8955078125, -6.396484375, -5.8974609375, -5.3984375, -4.8994140625, -4.400390625, -3.9013671875, -3.40234375, -2.9033203125, -2.404296875, -1.9052734375, -1.40625, -0.9072265625, -0.408203125, 0.0908203125, 0.58984375, 1.0888671875, 1.587890625, 2.0869140625, 2.5859375, 3.0849609375, 3.583984375, 4.0830078125, 4.58203125, 5.0810546875, 5.580078125, 6.0791015625, 6.578125, 7.0771484375, 7.576171875, 8.0751953125, 8.57421875, 9.0732421875, 9.572265625, 10.0712890625, 10.5703125, 11.0693359375, 11.568359375, 12.0673828125, 12.56640625, 13.0654296875, 13.564453125, 14.0634765625, 14.5625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 8.0, 7.0, 11.0, 5.0, 4.0, 7.0, 11.0, 14.0, 19.0, 19.0, 17.0, 27.0, 16.0, 27.0, 28.0, 36.0, 37.0, 33.0, 37.0, 29.0, 31.0, 45.0, 36.0, 38.0, 47.0, 37.0, 37.0, 33.0, 27.0, 33.0, 18.0, 25.0, 30.0, 21.0, 24.0, 20.0, 15.0, 21.0, 15.0, 10.0, 7.0, 9.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.546875, -12.1260986328125, -11.705322265625, -11.2845458984375, -10.86376953125, -10.4429931640625, -10.022216796875, -9.6014404296875, -9.1806640625, -8.7598876953125, -8.339111328125, -7.9183349609375, -7.49755859375, -7.0767822265625, -6.656005859375, -6.2352294921875, -5.814453125, -5.3936767578125, -4.972900390625, -4.5521240234375, -4.13134765625, -3.7105712890625, -3.289794921875, -2.8690185546875, -2.4482421875, -2.0274658203125, -1.606689453125, -1.1859130859375, -0.76513671875, -0.3443603515625, 0.076416015625, 0.4971923828125, 0.91796875, 1.3387451171875, 1.759521484375, 2.1802978515625, 2.60107421875, 3.0218505859375, 3.442626953125, 3.8634033203125, 4.2841796875, 4.7049560546875, 5.125732421875, 5.5465087890625, 5.96728515625, 6.3880615234375, 6.808837890625, 7.2296142578125, 7.650390625, 8.0711669921875, 8.491943359375, 8.9127197265625, 9.33349609375, 9.7542724609375, 10.175048828125, 10.5958251953125, 11.0166015625, 11.4373779296875, 11.858154296875, 12.2789306640625, 12.69970703125, 13.1204833984375, 13.541259765625, 13.9620361328125, 14.3828125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 8.0, 14.0, 22.0, 25.0, 46.0, 62.0, 89.0, 136.0, 208.0, 332.0, 489.0, 718.0, 1201.0, 1795.0, 2685.0, 4211.0, 6342.0, 9923.0, 15447.0, 24108.0, 36986.0, 57665.0, 87612.0, 131690.0, 190673.0, 264826.0, 347669.0, 421552.0, 469107.0, 470047.0, 428091.0, 354665.0, 272048.0, 196415.0, 136424.0, 91386.0, 60343.0, 38865.0, 25227.0, 15848.0, 10264.0, 6643.0, 4319.0, 2768.0, 1806.0, 1189.0, 800.0, 522.0, 343.0, 227.0, 158.0, 96.0, 54.0, 44.0, 21.0, 14.0, 10.0, 8.0, 5.0, 0.0, 4.0], "bins": [-13.6171875, -13.1922607421875, -12.767333984375, -12.3424072265625, -11.91748046875, -11.4925537109375, -11.067626953125, -10.6427001953125, -10.2177734375, -9.7928466796875, -9.367919921875, -8.9429931640625, -8.51806640625, -8.0931396484375, -7.668212890625, -7.2432861328125, -6.818359375, -6.3934326171875, -5.968505859375, -5.5435791015625, -5.11865234375, -4.6937255859375, -4.268798828125, -3.8438720703125, -3.4189453125, -2.9940185546875, -2.569091796875, -2.1441650390625, -1.71923828125, -1.2943115234375, -0.869384765625, -0.4444580078125, -0.01953125, 0.4053955078125, 0.830322265625, 1.2552490234375, 1.68017578125, 2.1051025390625, 2.530029296875, 2.9549560546875, 3.3798828125, 3.8048095703125, 4.229736328125, 4.6546630859375, 5.07958984375, 5.5045166015625, 5.929443359375, 6.3543701171875, 6.779296875, 7.2042236328125, 7.629150390625, 8.0540771484375, 8.47900390625, 8.9039306640625, 9.328857421875, 9.7537841796875, 10.1787109375, 10.6036376953125, 11.028564453125, 11.4534912109375, 11.87841796875, 12.3033447265625, 12.728271484375, 13.1531982421875, 13.578125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 6.0, 4.0, 11.0, 13.0, 18.0, 27.0, 27.0, 41.0, 40.0, 59.0, 62.0, 85.0, 79.0, 89.0, 116.0, 138.0, 155.0, 147.0, 201.0, 194.0, 217.0, 178.0, 207.0, 217.0, 200.0, 216.0, 188.0, 194.0, 162.0, 124.0, 98.0, 107.0, 85.0, 65.0, 66.0, 63.0, 46.0, 28.0, 27.0, 27.0, 11.0, 9.0, 11.0, 4.0, 7.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.4296875, -7.2138671875, -6.998046875, -6.7822265625, -6.56640625, -6.3505859375, -6.134765625, -5.9189453125, -5.703125, -5.4873046875, -5.271484375, -5.0556640625, -4.83984375, -4.6240234375, -4.408203125, -4.1923828125, -3.9765625, -3.7607421875, -3.544921875, -3.3291015625, -3.11328125, -2.8974609375, -2.681640625, -2.4658203125, -2.25, -2.0341796875, -1.818359375, -1.6025390625, -1.38671875, -1.1708984375, -0.955078125, -0.7392578125, -0.5234375, -0.3076171875, -0.091796875, 0.1240234375, 0.33984375, 0.5556640625, 0.771484375, 0.9873046875, 1.203125, 1.4189453125, 1.634765625, 1.8505859375, 2.06640625, 2.2822265625, 2.498046875, 2.7138671875, 2.9296875, 3.1455078125, 3.361328125, 3.5771484375, 3.79296875, 4.0087890625, 4.224609375, 4.4404296875, 4.65625, 4.8720703125, 5.087890625, 5.3037109375, 5.51953125, 5.7353515625, 5.951171875, 6.1669921875, 6.3828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 5.0, 14.0, 9.0, 24.0, 24.0, 24.0, 33.0, 36.0, 42.0, 41.0, 58.0, 63.0, 45.0, 71.0, 59.0, 48.0, 52.0, 61.0, 44.0, 45.0, 42.0, 26.0, 27.0, 18.0, 20.0, 18.0, 8.0, 5.0, 13.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.374731063842773, -19.740201950073242, -19.105670928955078, -18.471141815185547, -17.836610794067383, -17.20208168029785, -16.567550659179688, -15.933021545410156, -15.298492431640625, -14.663962364196777, -14.02943229675293, -13.394903182983398, -12.76037311553955, -12.125843048095703, -11.491312980651855, -10.856782913208008, -10.22225284576416, -9.587722778320312, -8.953192710876465, -8.318662643432617, -7.684133529663086, -7.049603462219238, -6.415073394775391, -5.780543804168701, -5.1460137367248535, -4.511483669281006, -3.8769540786743164, -3.2424240112304688, -2.6078941822052, -1.9733643531799316, -1.338834285736084, -0.7043046951293945, -0.06977462768554688, 0.5647552609443665, 1.1992851495742798, 1.833815097808838, 2.4683449268341064, 3.102874755859375, 3.7374048233032227, 4.371934413909912, 5.00646448135376, 5.640994548797607, 6.275524139404297, 6.9100542068481445, 7.544584274291992, 8.179113388061523, 8.813644409179688, 9.448173522949219, 10.082703590393066, 10.717233657836914, 11.351763725280762, 11.98629379272461, 12.62082290649414, 13.255352973937988, 13.889883041381836, 14.524412155151367, 15.158943176269531, 15.793473243713379, 16.428003311157227, 17.062532424926758, 17.697063446044922, 18.331592559814453, 18.966121673583984, 19.60065269470215, 20.23518180847168]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 5.0, 7.0, 6.0, 7.0, 17.0, 13.0, 15.0, 28.0, 28.0, 28.0, 21.0, 34.0, 45.0, 35.0, 41.0, 34.0, 41.0, 46.0, 49.0, 53.0, 34.0, 32.0, 48.0, 36.0, 35.0, 34.0, 31.0, 31.0, 28.0, 18.0, 18.0, 20.0, 14.0, 17.0, 9.0, 7.0, 8.0, 2.0, 3.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.138290405273438, -16.615663528442383, -16.093036651611328, -15.57040786743164, -15.047780990600586, -14.525154113769531, -14.00252628326416, -13.479898452758789, -12.957271575927734, -12.43464469909668, -11.912016868591309, -11.389389038085938, -10.866762161254883, -10.344135284423828, -9.821507453918457, -9.298879623413086, -8.776252746582031, -8.253625869750977, -7.7309980392456055, -7.208370685577393, -6.68574333190918, -6.163115978240967, -5.640488624572754, -5.117861270904541, -4.595233917236328, -4.072606563568115, -3.5499792098999023, -3.0273518562316895, -2.5047245025634766, -1.9820971488952637, -1.4594697952270508, -0.9368424415588379, -0.4142169952392578, 0.10841035842895508, 0.631037712097168, 1.1536650657653809, 1.6762924194335938, 2.1989197731018066, 2.7215471267700195, 3.2441744804382324, 3.7668018341064453, 4.289429187774658, 4.812056541442871, 5.334683895111084, 5.857311248779297, 6.37993860244751, 6.902565956115723, 7.4251933097839355, 7.947820663452148, 8.470447540283203, 8.993075370788574, 9.515703201293945, 10.038330078125, 10.560956954956055, 11.083584785461426, 11.606212615966797, 12.128839492797852, 12.651466369628906, 13.174094200134277, 13.696722030639648, 14.219348907470703, 14.741975784301758, 15.264603614807129, 15.7872314453125, 16.309858322143555]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 10.0, 12.0, 29.0, 41.0, 54.0, 124.0, 204.0, 350.0, 608.0, 1037.0, 1866.0, 3303.0, 5476.0, 9675.0, 15770.0, 26117.0, 41374.0, 63190.0, 93087.0, 122856.0, 144924.0, 143643.0, 120910.0, 89960.0, 61974.0, 40062.0, 24939.0, 15170.0, 9180.0, 5229.0, 3173.0, 1788.0, 984.0, 604.0, 348.0, 197.0, 126.0, 62.0, 37.0, 23.0, 16.0, 6.0, 8.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.880859375, -3.746856689453125, -3.61285400390625, -3.478851318359375, -3.3448486328125, -3.210845947265625, -3.07684326171875, -2.942840576171875, -2.808837890625, -2.674835205078125, -2.54083251953125, -2.406829833984375, -2.2728271484375, -2.138824462890625, -2.00482177734375, -1.870819091796875, -1.73681640625, -1.602813720703125, -1.46881103515625, -1.334808349609375, -1.2008056640625, -1.066802978515625, -0.93280029296875, -0.798797607421875, -0.664794921875, -0.530792236328125, -0.39678955078125, -0.262786865234375, -0.1287841796875, 0.005218505859375, 0.13922119140625, 0.273223876953125, 0.4072265625, 0.541229248046875, 0.67523193359375, 0.809234619140625, 0.9432373046875, 1.077239990234375, 1.21124267578125, 1.345245361328125, 1.479248046875, 1.613250732421875, 1.74725341796875, 1.881256103515625, 2.0152587890625, 2.149261474609375, 2.28326416015625, 2.417266845703125, 2.55126953125, 2.685272216796875, 2.81927490234375, 2.953277587890625, 3.0872802734375, 3.221282958984375, 3.35528564453125, 3.489288330078125, 3.623291015625, 3.757293701171875, 3.89129638671875, 4.025299072265625, 4.1593017578125, 4.293304443359375, 4.42730712890625, 4.561309814453125, 4.6953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 5.0, 8.0, 5.0, 8.0, 16.0, 13.0, 15.0, 29.0, 30.0, 25.0, 21.0, 36.0, 45.0, 35.0, 39.0, 34.0, 42.0, 46.0, 49.0, 53.0, 33.0, 33.0, 46.0, 35.0, 37.0, 32.0, 33.0, 29.0, 29.0, 18.0, 17.0, 21.0, 14.0, 17.0, 10.0, 6.0, 8.0, 3.0, 3.0, 6.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.125, -16.60400390625, -16.0830078125, -15.56201171875, -15.041015625, -14.52001953125, -13.9990234375, -13.47802734375, -12.95703125, -12.43603515625, -11.9150390625, -11.39404296875, -10.873046875, -10.35205078125, -9.8310546875, -9.31005859375, -8.7890625, -8.26806640625, -7.7470703125, -7.22607421875, -6.705078125, -6.18408203125, -5.6630859375, -5.14208984375, -4.62109375, -4.10009765625, -3.5791015625, -3.05810546875, -2.537109375, -2.01611328125, -1.4951171875, -0.97412109375, -0.453125, 0.06787109375, 0.5888671875, 1.10986328125, 1.630859375, 2.15185546875, 2.6728515625, 3.19384765625, 3.71484375, 4.23583984375, 4.7568359375, 5.27783203125, 5.798828125, 6.31982421875, 6.8408203125, 7.36181640625, 7.8828125, 8.40380859375, 8.9248046875, 9.44580078125, 9.966796875, 10.48779296875, 11.0087890625, 11.52978515625, 12.05078125, 12.57177734375, 13.0927734375, 13.61376953125, 14.134765625, 14.65576171875, 15.1767578125, 15.69775390625, 16.21875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 7.0, 4.0, 7.0, 5.0, 8.0, 19.0, 29.0, 46.0, 70.0, 71.0, 145.0, 209.0, 310.0, 489.0, 781.0, 1214.0, 2082.0, 3831.0, 6590.0, 12352.0, 23607.0, 71497.0, 843785.0, 39864.0, 18648.0, 9776.0, 5313.0, 3105.0, 1816.0, 1015.0, 608.0, 428.0, 287.0, 172.0, 108.0, 94.0, 34.0, 33.0, 31.0, 23.0, 16.0, 6.0, 8.0, 5.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.8359375, -14.3907470703125, -13.945556640625, -13.5003662109375, -13.05517578125, -12.6099853515625, -12.164794921875, -11.7196044921875, -11.2744140625, -10.8292236328125, -10.384033203125, -9.9388427734375, -9.49365234375, -9.0484619140625, -8.603271484375, -8.1580810546875, -7.712890625, -7.2677001953125, -6.822509765625, -6.3773193359375, -5.93212890625, -5.4869384765625, -5.041748046875, -4.5965576171875, -4.1513671875, -3.7061767578125, -3.260986328125, -2.8157958984375, -2.37060546875, -1.9254150390625, -1.480224609375, -1.0350341796875, -0.58984375, -0.1446533203125, 0.300537109375, 0.7457275390625, 1.19091796875, 1.6361083984375, 2.081298828125, 2.5264892578125, 2.9716796875, 3.4168701171875, 3.862060546875, 4.3072509765625, 4.75244140625, 5.1976318359375, 5.642822265625, 6.0880126953125, 6.533203125, 6.9783935546875, 7.423583984375, 7.8687744140625, 8.31396484375, 8.7591552734375, 9.204345703125, 9.6495361328125, 10.0947265625, 10.5399169921875, 10.985107421875, 11.4302978515625, 11.87548828125, 12.3206787109375, 12.765869140625, 13.2110595703125, 13.65625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 9.0, 11.0, 6.0, 7.0, 6.0, 11.0, 21.0, 11.0, 19.0, 18.0, 21.0, 27.0, 28.0, 25.0, 30.0, 30.0, 29.0, 37.0, 33.0, 50.0, 35.0, 45.0, 26.0, 43.0, 36.0, 24.0, 31.0, 38.0, 34.0, 28.0, 30.0, 26.0, 26.0, 22.0, 27.0, 12.0, 18.0, 17.0, 6.0, 9.0, 11.0, 6.0, 8.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0, -9.697021484375, -9.39404296875, -9.091064453125, -8.7880859375, -8.485107421875, -8.18212890625, -7.879150390625, -7.576171875, -7.273193359375, -6.97021484375, -6.667236328125, -6.3642578125, -6.061279296875, -5.75830078125, -5.455322265625, -5.15234375, -4.849365234375, -4.54638671875, -4.243408203125, -3.9404296875, -3.637451171875, -3.33447265625, -3.031494140625, -2.728515625, -2.425537109375, -2.12255859375, -1.819580078125, -1.5166015625, -1.213623046875, -0.91064453125, -0.607666015625, -0.3046875, -0.001708984375, 0.30126953125, 0.604248046875, 0.9072265625, 1.210205078125, 1.51318359375, 1.816162109375, 2.119140625, 2.422119140625, 2.72509765625, 3.028076171875, 3.3310546875, 3.634033203125, 3.93701171875, 4.239990234375, 4.54296875, 4.845947265625, 5.14892578125, 5.451904296875, 5.7548828125, 6.057861328125, 6.36083984375, 6.663818359375, 6.966796875, 7.269775390625, 7.57275390625, 7.875732421875, 8.1787109375, 8.481689453125, 8.78466796875, 9.087646484375, 9.390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 7.0, 10.0, 8.0, 14.0, 20.0, 50.0, 72.0, 80.0, 157.0, 209.0, 424.0, 713.0, 1284.0, 2310.0, 4513.0, 8682.0, 17530.0, 40395.0, 839344.0, 83882.0, 24178.0, 11748.0, 6025.0, 3102.0, 1640.0, 862.0, 506.0, 315.0, 168.0, 102.0, 66.0, 43.0, 35.0, 22.0, 12.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8115234375, -0.7859344482421875, -0.760345458984375, -0.7347564697265625, -0.70916748046875, -0.6835784912109375, -0.657989501953125, -0.6324005126953125, -0.6068115234375, -0.5812225341796875, -0.555633544921875, -0.5300445556640625, -0.50445556640625, -0.4788665771484375, -0.453277587890625, -0.4276885986328125, -0.402099609375, -0.3765106201171875, -0.350921630859375, -0.3253326416015625, -0.29974365234375, -0.2741546630859375, -0.248565673828125, -0.2229766845703125, -0.1973876953125, -0.1717987060546875, -0.146209716796875, -0.1206207275390625, -0.09503173828125, -0.0694427490234375, -0.043853759765625, -0.0182647705078125, 0.00732421875, 0.0329132080078125, 0.058502197265625, 0.0840911865234375, 0.10968017578125, 0.1352691650390625, 0.160858154296875, 0.1864471435546875, 0.2120361328125, 0.2376251220703125, 0.263214111328125, 0.2888031005859375, 0.31439208984375, 0.3399810791015625, 0.365570068359375, 0.3911590576171875, 0.416748046875, 0.4423370361328125, 0.467926025390625, 0.4935150146484375, 0.51910400390625, 0.5446929931640625, 0.570281982421875, 0.5958709716796875, 0.6214599609375, 0.6470489501953125, 0.672637939453125, 0.6982269287109375, 0.72381591796875, 0.7494049072265625, 0.774993896484375, 0.8005828857421875, 0.826171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 5.0, 2.0, 4.0, 9.0, 5.0, 4.0, 9.0, 9.0, 9.0, 27.0, 25.0, 19.0, 32.0, 31.0, 25.0, 44.0, 60.0, 53.0, 52.0, 41.0, 53.0, 54.0, 57.0, 51.0, 42.0, 53.0, 33.0, 29.0, 25.0, 29.0, 22.0, 16.0, 12.0, 19.0, 8.0, 7.0, 7.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.93986701965332e-05, -3.82671132683754e-05, -3.713555634021759e-05, -3.6003999412059784e-05, -3.487244248390198e-05, -3.374088555574417e-05, -3.2609328627586365e-05, -3.147777169942856e-05, -3.0346214771270752e-05, -2.9214657843112946e-05, -2.808310091495514e-05, -2.6951543986797333e-05, -2.5819987058639526e-05, -2.468843013048172e-05, -2.3556873202323914e-05, -2.2425316274166107e-05, -2.12937593460083e-05, -2.0162202417850494e-05, -1.9030645489692688e-05, -1.789908856153488e-05, -1.6767531633377075e-05, -1.563597470521927e-05, -1.4504417777061462e-05, -1.3372860848903656e-05, -1.224130392074585e-05, -1.1109746992588043e-05, -9.978190064430237e-06, -8.84663313627243e-06, -7.715076208114624e-06, -6.583519279956818e-06, -5.451962351799011e-06, -4.320405423641205e-06, -3.1888484954833984e-06, -2.057291567325592e-06, -9.257346391677856e-07, 2.0582228899002075e-07, 1.3373792171478271e-06, 2.4689361453056335e-06, 3.60049307346344e-06, 4.732050001621246e-06, 5.863606929779053e-06, 6.995163857936859e-06, 8.126720786094666e-06, 9.258277714252472e-06, 1.0389834642410278e-05, 1.1521391570568085e-05, 1.2652948498725891e-05, 1.3784505426883698e-05, 1.4916062355041504e-05, 1.604761928319931e-05, 1.7179176211357117e-05, 1.8310733139514923e-05, 1.944229006767273e-05, 2.0573846995830536e-05, 2.1705403923988342e-05, 2.283696085214615e-05, 2.3968517780303955e-05, 2.510007470846176e-05, 2.6231631636619568e-05, 2.7363188564777374e-05, 2.849474549293518e-05, 2.9626302421092987e-05, 3.0757859349250793e-05, 3.18894162774086e-05, 3.3020973205566406e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 18.0, 18.0, 36.0, 49.0, 89.0, 151.0, 225.0, 368.0, 553.0, 839.0, 1276.0, 1846.0, 2893.0, 4360.0, 6360.0, 9382.0, 13638.0, 20250.0, 29208.0, 41834.0, 58219.0, 78760.0, 99552.0, 117711.0, 122132.0, 110567.0, 91141.0, 69978.0, 51524.0, 36383.0, 25566.0, 17217.0, 12031.0, 7819.0, 5530.0, 3748.0, 2492.0, 1641.0, 1112.0, 753.0, 466.0, 309.0, 209.0, 108.0, 74.0, 51.0, 21.0, 21.0, 14.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5767898559570312, -0.5583648681640625, -0.5399398803710938, -0.521514892578125, -0.5030899047851562, -0.4846649169921875, -0.46623992919921875, -0.44781494140625, -0.42938995361328125, -0.4109649658203125, -0.39253997802734375, -0.374114990234375, -0.35569000244140625, -0.3372650146484375, -0.31884002685546875, -0.3004150390625, -0.28199005126953125, -0.2635650634765625, -0.24514007568359375, -0.226715087890625, -0.20829010009765625, -0.1898651123046875, -0.17144012451171875, -0.15301513671875, -0.13459014892578125, -0.1161651611328125, -0.09774017333984375, -0.079315185546875, -0.06089019775390625, -0.0424652099609375, -0.02404022216796875, -0.005615234375, 0.01280975341796875, 0.0312347412109375, 0.04965972900390625, 0.068084716796875, 0.08650970458984375, 0.1049346923828125, 0.12335968017578125, 0.14178466796875, 0.16020965576171875, 0.1786346435546875, 0.19705963134765625, 0.215484619140625, 0.23390960693359375, 0.2523345947265625, 0.27075958251953125, 0.2891845703125, 0.30760955810546875, 0.3260345458984375, 0.34445953369140625, 0.362884521484375, 0.38130950927734375, 0.3997344970703125, 0.41815948486328125, 0.43658447265625, 0.45500946044921875, 0.4734344482421875, 0.49185943603515625, 0.510284423828125, 0.5287094116210938, 0.5471343994140625, 0.5655593872070312, 0.583984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 8.0, 5.0, 4.0, 10.0, 12.0, 5.0, 4.0, 10.0, 16.0, 21.0, 21.0, 16.0, 25.0, 45.0, 27.0, 48.0, 33.0, 48.0, 52.0, 49.0, 43.0, 44.0, 43.0, 49.0, 47.0, 45.0, 29.0, 41.0, 32.0, 24.0, 23.0, 29.0, 10.0, 19.0, 11.0, 11.0, 8.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.279296875, -0.2709312438964844, -0.26256561279296875, -0.2541999816894531, -0.2458343505859375, -0.23746871948242188, -0.22910308837890625, -0.22073745727539062, -0.212371826171875, -0.20400619506835938, -0.19564056396484375, -0.18727493286132812, -0.1789093017578125, -0.17054367065429688, -0.16217803955078125, -0.15381240844726562, -0.14544677734375, -0.13708114624023438, -0.12871551513671875, -0.12034988403320312, -0.1119842529296875, -0.10361862182617188, -0.09525299072265625, -0.08688735961914062, -0.078521728515625, -0.07015609741210938, -0.06179046630859375, -0.053424835205078125, -0.0450592041015625, -0.036693572998046875, -0.02832794189453125, -0.019962310791015625, -0.0115966796875, -0.003231048583984375, 0.00513458251953125, 0.013500213623046875, 0.0218658447265625, 0.030231475830078125, 0.03859710693359375, 0.046962738037109375, 0.055328369140625, 0.06369400024414062, 0.07205963134765625, 0.08042526245117188, 0.0887908935546875, 0.09715652465820312, 0.10552215576171875, 0.11388778686523438, 0.12225341796875, 0.13061904907226562, 0.13898468017578125, 0.14735031127929688, 0.1557159423828125, 0.16408157348632812, 0.17244720458984375, 0.18081283569335938, 0.189178466796875, 0.19754409790039062, 0.20590972900390625, 0.21427536010742188, 0.2226409912109375, 0.23100662231445312, 0.23937225341796875, 0.24773788452148438, 0.256103515625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 11.0, 11.0, 21.0, 27.0, 23.0, 29.0, 38.0, 31.0, 39.0, 52.0, 58.0, 48.0, 71.0, 53.0, 50.0, 61.0, 42.0, 54.0, 45.0, 37.0, 34.0, 35.0, 21.0, 20.0, 20.0, 12.0, 12.0, 5.0, 9.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.990995407104492, -19.376527786254883, -18.76205825805664, -18.14759063720703, -17.533123016357422, -16.91865348815918, -16.30418586730957, -15.689717292785645, -15.075248718261719, -14.460780143737793, -13.846311569213867, -13.231843948364258, -12.617375373840332, -12.002906799316406, -11.388439178466797, -10.773970603942871, -10.159502029418945, -9.54503345489502, -8.930564880371094, -8.316097259521484, -7.701628684997559, -7.087160110473633, -6.472692012786865, -5.858223915100098, -5.243755340576172, -4.629286766052246, -4.0148186683654785, -3.400350332260132, -2.785881996154785, -2.1714136600494385, -1.5569453239440918, -0.9424772262573242, -0.3280067443847656, 0.28646159172058105, 0.9009299278259277, 1.5153982639312744, 2.129866600036621, 2.7443349361419678, 3.3588032722473145, 3.973271369934082, 4.587739944458008, 5.202208518981934, 5.816676616668701, 6.431144714355469, 7.0456132888793945, 7.66008186340332, 8.27454948425293, 8.889018058776855, 9.503486633300781, 10.117955207824707, 10.732423782348633, 11.346891403198242, 11.961359977722168, 12.575828552246094, 13.190296173095703, 13.804764747619629, 14.419233322143555, 15.03370189666748, 15.648170471191406, 16.262638092041016, 16.877105712890625, 17.491575241088867, 18.106042861938477, 18.72051239013672, 19.334980010986328]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 9.0, 5.0, 6.0, 6.0, 7.0, 17.0, 13.0, 12.0, 24.0, 38.0, 25.0, 21.0, 33.0, 36.0, 43.0, 36.0, 37.0, 42.0, 50.0, 47.0, 53.0, 40.0, 26.0, 48.0, 34.0, 37.0, 34.0, 30.0, 28.0, 33.0, 18.0, 17.0, 20.0, 15.0, 17.0, 11.0, 7.0, 7.0, 2.0, 4.0, 6.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.317588806152344, -16.79276466369629, -16.267940521240234, -15.74311637878418, -15.218292236328125, -14.69346809387207, -14.168643951416016, -13.643819808959961, -13.118995666503906, -12.594171524047852, -12.069347381591797, -11.544523239135742, -11.019699096679688, -10.494874954223633, -9.970050811767578, -9.445226669311523, -8.920403480529785, -8.39557933807373, -7.870755195617676, -7.345931053161621, -6.821106910705566, -6.296282768249512, -5.771459102630615, -5.2466349601745605, -4.721810817718506, -4.196986675262451, -3.6721625328063965, -3.147338628768921, -2.622514486312866, -2.0976903438568115, -1.572866439819336, -1.0480422973632812, -0.5232181549072266, 0.0016059279441833496, 0.5264300107955933, 1.0512540340423584, 1.576078176498413, 2.1009023189544678, 2.6257262229919434, 3.150550365447998, 3.6753745079040527, 4.200198650360107, 4.725022792816162, 5.249846458435059, 5.774670600891113, 6.299494743347168, 6.824318885803223, 7.349143028259277, 7.873967170715332, 8.398791313171387, 8.923615455627441, 9.448439598083496, 9.97326374053955, 10.498087882995605, 11.022911071777344, 11.547735214233398, 12.072559356689453, 12.597383499145508, 13.122207641601562, 13.647031784057617, 14.171855926513672, 14.696680068969727, 15.221504211425781, 15.746328353881836, 16.27115249633789]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 10.0, 4.0, 8.0, 16.0, 32.0, 47.0, 65.0, 108.0, 177.0, 273.0, 403.0, 673.0, 1109.0, 1681.0, 2724.0, 4263.0, 6493.0, 10347.0, 15541.0, 23081.0, 32985.0, 45565.0, 60859.0, 76986.0, 91210.0, 101524.0, 104597.0, 101134.0, 90297.0, 75833.0, 59301.0, 44277.0, 32369.0, 22118.0, 14791.0, 9981.0, 6481.0, 4103.0, 2647.0, 1665.0, 1031.0, 629.0, 440.0, 274.0, 147.0, 110.0, 61.0, 35.0, 25.0, 20.0, 6.0, 7.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.7265625, -12.33447265625, -11.9423828125, -11.55029296875, -11.158203125, -10.76611328125, -10.3740234375, -9.98193359375, -9.58984375, -9.19775390625, -8.8056640625, -8.41357421875, -8.021484375, -7.62939453125, -7.2373046875, -6.84521484375, -6.453125, -6.06103515625, -5.6689453125, -5.27685546875, -4.884765625, -4.49267578125, -4.1005859375, -3.70849609375, -3.31640625, -2.92431640625, -2.5322265625, -2.14013671875, -1.748046875, -1.35595703125, -0.9638671875, -0.57177734375, -0.1796875, 0.21240234375, 0.6044921875, 0.99658203125, 1.388671875, 1.78076171875, 2.1728515625, 2.56494140625, 2.95703125, 3.34912109375, 3.7412109375, 4.13330078125, 4.525390625, 4.91748046875, 5.3095703125, 5.70166015625, 6.09375, 6.48583984375, 6.8779296875, 7.27001953125, 7.662109375, 8.05419921875, 8.4462890625, 8.83837890625, 9.23046875, 9.62255859375, 10.0146484375, 10.40673828125, 10.798828125, 11.19091796875, 11.5830078125, 11.97509765625, 12.3671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 10.0, 5.0, 5.0, 6.0, 9.0, 16.0, 13.0, 13.0, 20.0, 35.0, 27.0, 22.0, 30.0, 40.0, 36.0, 42.0, 39.0, 39.0, 50.0, 39.0, 61.0, 37.0, 31.0, 46.0, 32.0, 33.0, 43.0, 32.0, 21.0, 36.0, 17.0, 18.0, 23.0, 16.0, 16.0, 10.0, 5.0, 9.0, 3.0, 5.0, 5.0, 8.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.765625, -16.2591552734375, -15.752685546875, -15.2462158203125, -14.73974609375, -14.2332763671875, -13.726806640625, -13.2203369140625, -12.7138671875, -12.2073974609375, -11.700927734375, -11.1944580078125, -10.68798828125, -10.1815185546875, -9.675048828125, -9.1685791015625, -8.662109375, -8.1556396484375, -7.649169921875, -7.1427001953125, -6.63623046875, -6.1297607421875, -5.623291015625, -5.1168212890625, -4.6103515625, -4.1038818359375, -3.597412109375, -3.0909423828125, -2.58447265625, -2.0780029296875, -1.571533203125, -1.0650634765625, -0.55859375, -0.0521240234375, 0.454345703125, 0.9608154296875, 1.46728515625, 1.9737548828125, 2.480224609375, 2.9866943359375, 3.4931640625, 3.9996337890625, 4.506103515625, 5.0125732421875, 5.51904296875, 6.0255126953125, 6.531982421875, 7.0384521484375, 7.544921875, 8.0513916015625, 8.557861328125, 9.0643310546875, 9.57080078125, 10.0772705078125, 10.583740234375, 11.0902099609375, 11.5966796875, 12.1031494140625, 12.609619140625, 13.1160888671875, 13.62255859375, 14.1290283203125, 14.635498046875, 15.1419677734375, 15.6484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 9.0, 16.0, 31.0, 55.0, 92.0, 147.0, 258.0, 519.0, 1025.0, 1864.0, 3577.0, 6802.0, 12711.0, 22577.0, 39512.0, 63975.0, 96170.0, 128977.0, 150056.0, 149019.0, 126711.0, 94659.0, 62958.0, 38317.0, 22321.0, 12242.0, 6514.0, 3494.0, 1870.0, 1004.0, 508.0, 253.0, 142.0, 80.0, 37.0, 28.0, 14.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.796875, -15.251708984375, -14.70654296875, -14.161376953125, -13.6162109375, -13.071044921875, -12.52587890625, -11.980712890625, -11.435546875, -10.890380859375, -10.34521484375, -9.800048828125, -9.2548828125, -8.709716796875, -8.16455078125, -7.619384765625, -7.07421875, -6.529052734375, -5.98388671875, -5.438720703125, -4.8935546875, -4.348388671875, -3.80322265625, -3.258056640625, -2.712890625, -2.167724609375, -1.62255859375, -1.077392578125, -0.5322265625, 0.012939453125, 0.55810546875, 1.103271484375, 1.6484375, 2.193603515625, 2.73876953125, 3.283935546875, 3.8291015625, 4.374267578125, 4.91943359375, 5.464599609375, 6.009765625, 6.554931640625, 7.10009765625, 7.645263671875, 8.1904296875, 8.735595703125, 9.28076171875, 9.825927734375, 10.37109375, 10.916259765625, 11.46142578125, 12.006591796875, 12.5517578125, 13.096923828125, 13.64208984375, 14.187255859375, 14.732421875, 15.277587890625, 15.82275390625, 16.367919921875, 16.9130859375, 17.458251953125, 18.00341796875, 18.548583984375, 19.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 5.0, 6.0, 5.0, 12.0, 10.0, 13.0, 24.0, 11.0, 17.0, 25.0, 26.0, 34.0, 31.0, 20.0, 39.0, 42.0, 41.0, 50.0, 40.0, 47.0, 34.0, 36.0, 42.0, 35.0, 54.0, 40.0, 44.0, 30.0, 34.0, 27.0, 21.0, 20.0, 16.0, 12.0, 18.0, 9.0, 6.0, 5.0, 5.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.2828369140625, -9.940673828125, -9.5985107421875, -9.25634765625, -8.9141845703125, -8.572021484375, -8.2298583984375, -7.8876953125, -7.5455322265625, -7.203369140625, -6.8612060546875, -6.51904296875, -6.1768798828125, -5.834716796875, -5.4925537109375, -5.150390625, -4.8082275390625, -4.466064453125, -4.1239013671875, -3.78173828125, -3.4395751953125, -3.097412109375, -2.7552490234375, -2.4130859375, -2.0709228515625, -1.728759765625, -1.3865966796875, -1.04443359375, -0.7022705078125, -0.360107421875, -0.0179443359375, 0.32421875, 0.6663818359375, 1.008544921875, 1.3507080078125, 1.69287109375, 2.0350341796875, 2.377197265625, 2.7193603515625, 3.0615234375, 3.4036865234375, 3.745849609375, 4.0880126953125, 4.43017578125, 4.7723388671875, 5.114501953125, 5.4566650390625, 5.798828125, 6.1409912109375, 6.483154296875, 6.8253173828125, 7.16748046875, 7.5096435546875, 7.851806640625, 8.1939697265625, 8.5361328125, 8.8782958984375, 9.220458984375, 9.5626220703125, 9.90478515625, 10.2469482421875, 10.589111328125, 10.9312744140625, 11.2734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 7.0, 6.0, 13.0, 12.0, 28.0, 36.0, 57.0, 76.0, 100.0, 141.0, 285.0, 436.0, 745.0, 1218.0, 2156.0, 3843.0, 6685.0, 11823.0, 20256.0, 35324.0, 57684.0, 88717.0, 122100.0, 147469.0, 151530.0, 132030.0, 100050.0, 67168.0, 41480.0, 24354.0, 14052.0, 7805.0, 4478.0, 2579.0, 1489.0, 880.0, 498.0, 357.0, 205.0, 136.0, 71.0, 60.0, 39.0, 19.0, 20.0, 8.0, 9.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.01953125, -5.82635498046875, -5.6331787109375, -5.44000244140625, -5.246826171875, -5.05364990234375, -4.8604736328125, -4.66729736328125, -4.47412109375, -4.28094482421875, -4.0877685546875, -3.89459228515625, -3.701416015625, -3.50823974609375, -3.3150634765625, -3.12188720703125, -2.9287109375, -2.73553466796875, -2.5423583984375, -2.34918212890625, -2.156005859375, -1.96282958984375, -1.7696533203125, -1.57647705078125, -1.38330078125, -1.19012451171875, -0.9969482421875, -0.80377197265625, -0.610595703125, -0.41741943359375, -0.2242431640625, -0.03106689453125, 0.162109375, 0.35528564453125, 0.5484619140625, 0.74163818359375, 0.934814453125, 1.12799072265625, 1.3211669921875, 1.51434326171875, 1.70751953125, 1.90069580078125, 2.0938720703125, 2.28704833984375, 2.480224609375, 2.67340087890625, 2.8665771484375, 3.05975341796875, 3.2529296875, 3.44610595703125, 3.6392822265625, 3.83245849609375, 4.025634765625, 4.21881103515625, 4.4119873046875, 4.60516357421875, 4.79833984375, 4.99151611328125, 5.1846923828125, 5.37786865234375, 5.571044921875, 5.76422119140625, 5.9573974609375, 6.15057373046875, 6.34375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 7.0, 8.0, 6.0, 11.0, 9.0, 6.0, 21.0, 11.0, 31.0, 20.0, 34.0, 47.0, 45.0, 69.0, 47.0, 72.0, 54.0, 54.0, 55.0, 61.0, 58.0, 56.0, 42.0, 42.0, 24.0, 24.0, 20.0, 18.0, 12.0, 9.0, 8.0, 3.0, 5.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007781982421875, -0.0007561147212982178, -0.0007340312004089355, -0.0007119476795196533, -0.0006898641586303711, -0.0006677806377410889, -0.0006456971168518066, -0.0006236135959625244, -0.0006015300750732422, -0.00057944655418396, -0.0005573630332946777, -0.0005352795124053955, -0.0005131959915161133, -0.0004911124706268311, -0.00046902894973754883, -0.0004469454288482666, -0.0004248619079589844, -0.00040277838706970215, -0.0003806948661804199, -0.0003586113452911377, -0.00033652782440185547, -0.00031444430351257324, -0.000292360782623291, -0.0002702772617340088, -0.00024819374084472656, -0.00022611021995544434, -0.0002040266990661621, -0.00018194317817687988, -0.00015985965728759766, -0.00013777613639831543, -0.0001156926155090332, -9.360909461975098e-05, -7.152557373046875e-05, -4.9442052841186523e-05, -2.7358531951904297e-05, -5.27501106262207e-06, 1.6808509826660156e-05, 3.889203071594238e-05, 6.097555160522461e-05, 8.305907249450684e-05, 0.00010514259338378906, 0.0001272261142730713, 0.00014930963516235352, 0.00017139315605163574, 0.00019347667694091797, 0.0002155601978302002, 0.00023764371871948242, 0.00025972723960876465, 0.0002818107604980469, 0.0003038942813873291, 0.00032597780227661133, 0.00034806132316589355, 0.0003701448440551758, 0.000392228364944458, 0.00041431188583374023, 0.00043639540672302246, 0.0004584789276123047, 0.0004805624485015869, 0.0005026459693908691, 0.0005247294902801514, 0.0005468130111694336, 0.0005688965320587158, 0.000590980052947998, 0.0006130635738372803, 0.0006351470947265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 4.0, 3.0, 15.0, 15.0, 13.0, 31.0, 36.0, 42.0, 74.0, 104.0, 156.0, 205.0, 329.0, 450.0, 678.0, 1019.0, 1514.0, 2379.0, 3671.0, 5821.0, 9094.0, 14178.0, 23112.0, 35815.0, 55178.0, 79558.0, 106460.0, 127471.0, 135449.0, 124833.0, 102054.0, 75619.0, 51336.0, 33402.0, 21075.0, 13504.0, 8517.0, 5223.0, 3529.0, 2118.0, 1445.0, 998.0, 650.0, 432.0, 305.0, 212.0, 121.0, 102.0, 72.0, 47.0, 31.0, 20.0, 20.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.125, -5.9300537109375, -5.735107421875, -5.5401611328125, -5.34521484375, -5.1502685546875, -4.955322265625, -4.7603759765625, -4.5654296875, -4.3704833984375, -4.175537109375, -3.9805908203125, -3.78564453125, -3.5906982421875, -3.395751953125, -3.2008056640625, -3.005859375, -2.8109130859375, -2.615966796875, -2.4210205078125, -2.22607421875, -2.0311279296875, -1.836181640625, -1.6412353515625, -1.4462890625, -1.2513427734375, -1.056396484375, -0.8614501953125, -0.66650390625, -0.4715576171875, -0.276611328125, -0.0816650390625, 0.11328125, 0.3082275390625, 0.503173828125, 0.6981201171875, 0.89306640625, 1.0880126953125, 1.282958984375, 1.4779052734375, 1.6728515625, 1.8677978515625, 2.062744140625, 2.2576904296875, 2.45263671875, 2.6475830078125, 2.842529296875, 3.0374755859375, 3.232421875, 3.4273681640625, 3.622314453125, 3.8172607421875, 4.01220703125, 4.2071533203125, 4.402099609375, 4.5970458984375, 4.7919921875, 4.9869384765625, 5.181884765625, 5.3768310546875, 5.57177734375, 5.7667236328125, 5.961669921875, 6.1566162109375, 6.3515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 0.0, 4.0, 5.0, 5.0, 2.0, 8.0, 6.0, 13.0, 4.0, 19.0, 31.0, 25.0, 38.0, 30.0, 35.0, 41.0, 59.0, 46.0, 52.0, 60.0, 68.0, 51.0, 58.0, 46.0, 47.0, 45.0, 31.0, 28.0, 29.0, 25.0, 18.0, 18.0, 12.0, 13.0, 8.0, 7.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.93359375, -2.839447021484375, -2.74530029296875, -2.651153564453125, -2.5570068359375, -2.462860107421875, -2.36871337890625, -2.274566650390625, -2.180419921875, -2.086273193359375, -1.99212646484375, -1.897979736328125, -1.8038330078125, -1.709686279296875, -1.61553955078125, -1.521392822265625, -1.42724609375, -1.333099365234375, -1.23895263671875, -1.144805908203125, -1.0506591796875, -0.956512451171875, -0.86236572265625, -0.768218994140625, -0.674072265625, -0.579925537109375, -0.48577880859375, -0.391632080078125, -0.2974853515625, -0.203338623046875, -0.10919189453125, -0.015045166015625, 0.0791015625, 0.173248291015625, 0.26739501953125, 0.361541748046875, 0.4556884765625, 0.549835205078125, 0.64398193359375, 0.738128662109375, 0.832275390625, 0.926422119140625, 1.02056884765625, 1.114715576171875, 1.2088623046875, 1.303009033203125, 1.39715576171875, 1.491302490234375, 1.58544921875, 1.679595947265625, 1.77374267578125, 1.867889404296875, 1.9620361328125, 2.056182861328125, 2.15032958984375, 2.244476318359375, 2.338623046875, 2.432769775390625, 2.52691650390625, 2.621063232421875, 2.7152099609375, 2.809356689453125, 2.90350341796875, 2.997650146484375, 3.091796875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 10.0, 12.0, 13.0, 17.0, 24.0, 24.0, 34.0, 40.0, 49.0, 49.0, 48.0, 64.0, 62.0, 50.0, 51.0, 62.0, 41.0, 55.0, 46.0, 35.0, 57.0, 25.0, 23.0, 15.0, 17.0, 15.0, 17.0, 9.0, 6.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09556770324707, -18.480003356933594, -17.864437103271484, -17.248872756958008, -16.6333065032959, -16.017742156982422, -15.402176856994629, -14.786611557006836, -14.171046257019043, -13.55548095703125, -12.939915657043457, -12.324350357055664, -11.708786010742188, -11.093219757080078, -10.477655410766602, -9.862090110778809, -9.246524810791016, -8.630959510803223, -8.01539421081543, -7.399829387664795, -6.784264087677002, -6.168698787689209, -5.553133964538574, -4.937568664550781, -4.322003364562988, -3.7064380645751953, -3.0908730030059814, -2.4753079414367676, -1.8597426414489746, -1.2441773414611816, -0.6286122798919678, -0.013047218322753906, 0.6025161743164062, 1.2180813550949097, 1.833646535873413, 2.449211597442627, 3.06477689743042, 3.680342197418213, 4.295907020568848, 4.911472320556641, 5.527037620544434, 6.142602920532227, 6.7581682205200195, 7.373733043670654, 7.989298343658447, 8.604864120483398, 9.220428466796875, 9.835993766784668, 10.451559066772461, 11.067124366760254, 11.682689666748047, 12.29825496673584, 12.913820266723633, 13.52938461303711, 14.144949913024902, 14.760515213012695, 15.376080513000488, 15.991645812988281, 16.607210159301758, 17.222776412963867, 17.838340759277344, 18.453907012939453, 19.06947135925293, 19.685035705566406, 20.300601959228516]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 10.0, 15.0, 11.0, 10.0, 18.0, 25.0, 21.0, 20.0, 28.0, 22.0, 36.0, 32.0, 29.0, 43.0, 32.0, 39.0, 41.0, 27.0, 35.0, 43.0, 36.0, 36.0, 42.0, 29.0, 29.0, 29.0, 30.0, 19.0, 23.0, 23.0, 19.0, 21.0, 18.0, 14.0, 13.0, 10.0, 10.0, 6.0, 6.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.203418731689453, -13.735404014587402, -13.267388343811035, -12.799373626708984, -12.331357955932617, -11.863343238830566, -11.395328521728516, -10.927312850952148, -10.459298133850098, -9.991283416748047, -9.52326774597168, -9.055253028869629, -8.587238311767578, -8.119222640991211, -7.65120792388916, -7.183192729949951, -6.715177536010742, -6.247162342071533, -5.779147148132324, -5.311132431030273, -4.8431172370910645, -4.3751020431518555, -3.9070870876312256, -3.4390721321105957, -2.9710569381713867, -2.5030417442321777, -2.035026788711548, -1.5670117139816284, -1.098996639251709, -0.6309814453125, -0.16296648979187012, 0.30504846572875977, 0.7730636596679688, 1.2410787343978882, 1.7090938091278076, 2.1771087646484375, 2.6451239585876465, 3.1131391525268555, 3.5811541080474854, 4.049169063568115, 4.517184257507324, 4.985199451446533, 5.453214645385742, 5.921229362487793, 6.389244556427002, 6.857259750366211, 7.325274467468262, 7.793289661407471, 8.26130485534668, 8.72931957244873, 9.197335243225098, 9.665349960327148, 10.133365631103516, 10.601380348205566, 11.069395065307617, 11.537410736083984, 12.005425453186035, 12.473440170288086, 12.941455841064453, 13.409470558166504, 13.877485275268555, 14.345500946044922, 14.813515663146973, 15.281530380249023, 15.74954605102539]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 8.0, 14.0, 28.0, 27.0, 53.0, 73.0, 106.0, 210.0, 282.0, 450.0, 736.0, 1243.0, 1952.0, 3126.0, 5145.0, 8704.0, 14289.0, 24278.0, 41046.0, 69269.0, 117538.0, 191491.0, 299084.0, 427131.0, 542616.0, 596287.0, 557862.0, 448609.0, 317390.0, 207205.0, 127400.0, 77197.0, 45880.0, 26935.0, 16017.0, 9556.0, 5849.0, 3513.0, 2126.0, 1363.0, 809.0, 548.0, 313.0, 181.0, 114.0, 80.0, 58.0, 33.0, 22.0, 13.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-16.015625, -15.524169921875, -15.03271484375, -14.541259765625, -14.0498046875, -13.558349609375, -13.06689453125, -12.575439453125, -12.083984375, -11.592529296875, -11.10107421875, -10.609619140625, -10.1181640625, -9.626708984375, -9.13525390625, -8.643798828125, -8.15234375, -7.660888671875, -7.16943359375, -6.677978515625, -6.1865234375, -5.695068359375, -5.20361328125, -4.712158203125, -4.220703125, -3.729248046875, -3.23779296875, -2.746337890625, -2.2548828125, -1.763427734375, -1.27197265625, -0.780517578125, -0.2890625, 0.202392578125, 0.69384765625, 1.185302734375, 1.6767578125, 2.168212890625, 2.65966796875, 3.151123046875, 3.642578125, 4.134033203125, 4.62548828125, 5.116943359375, 5.6083984375, 6.099853515625, 6.59130859375, 7.082763671875, 7.57421875, 8.065673828125, 8.55712890625, 9.048583984375, 9.5400390625, 10.031494140625, 10.52294921875, 11.014404296875, 11.505859375, 11.997314453125, 12.48876953125, 12.980224609375, 13.4716796875, 13.963134765625, 14.45458984375, 14.946044921875, 15.4375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 3.0, 13.0, 9.0, 10.0, 13.0, 14.0, 24.0, 23.0, 20.0, 24.0, 31.0, 23.0, 33.0, 38.0, 38.0, 33.0, 35.0, 39.0, 38.0, 34.0, 36.0, 31.0, 40.0, 44.0, 33.0, 27.0, 27.0, 28.0, 26.0, 19.0, 23.0, 20.0, 21.0, 22.0, 13.0, 10.0, 15.0, 10.0, 6.0, 8.0, 5.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.75, -12.334716796875, -11.91943359375, -11.504150390625, -11.0888671875, -10.673583984375, -10.25830078125, -9.843017578125, -9.427734375, -9.012451171875, -8.59716796875, -8.181884765625, -7.7666015625, -7.351318359375, -6.93603515625, -6.520751953125, -6.10546875, -5.690185546875, -5.27490234375, -4.859619140625, -4.4443359375, -4.029052734375, -3.61376953125, -3.198486328125, -2.783203125, -2.367919921875, -1.95263671875, -1.537353515625, -1.1220703125, -0.706787109375, -0.29150390625, 0.123779296875, 0.5390625, 0.954345703125, 1.36962890625, 1.784912109375, 2.2001953125, 2.615478515625, 3.03076171875, 3.446044921875, 3.861328125, 4.276611328125, 4.69189453125, 5.107177734375, 5.5224609375, 5.937744140625, 6.35302734375, 6.768310546875, 7.18359375, 7.598876953125, 8.01416015625, 8.429443359375, 8.8447265625, 9.260009765625, 9.67529296875, 10.090576171875, 10.505859375, 10.921142578125, 11.33642578125, 11.751708984375, 12.1669921875, 12.582275390625, 12.99755859375, 13.412841796875, 13.828125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 13.0, 15.0, 22.0, 44.0, 91.0, 129.0, 246.0, 376.0, 653.0, 1059.0, 1881.0, 3268.0, 5362.0, 9268.0, 16175.0, 27553.0, 48146.0, 81080.0, 134173.0, 213468.0, 319194.0, 437550.0, 532559.0, 570728.0, 527823.0, 428788.0, 310163.0, 207141.0, 130008.0, 77826.0, 46000.0, 26556.0, 15427.0, 8936.0, 5089.0, 3077.0, 1787.0, 1087.0, 622.0, 374.0, 213.0, 132.0, 84.0, 41.0, 30.0, 13.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.984375, -16.461181640625, -15.93798828125, -15.414794921875, -14.8916015625, -14.368408203125, -13.84521484375, -13.322021484375, -12.798828125, -12.275634765625, -11.75244140625, -11.229248046875, -10.7060546875, -10.182861328125, -9.65966796875, -9.136474609375, -8.61328125, -8.090087890625, -7.56689453125, -7.043701171875, -6.5205078125, -5.997314453125, -5.47412109375, -4.950927734375, -4.427734375, -3.904541015625, -3.38134765625, -2.858154296875, -2.3349609375, -1.811767578125, -1.28857421875, -0.765380859375, -0.2421875, 0.281005859375, 0.80419921875, 1.327392578125, 1.8505859375, 2.373779296875, 2.89697265625, 3.420166015625, 3.943359375, 4.466552734375, 4.98974609375, 5.512939453125, 6.0361328125, 6.559326171875, 7.08251953125, 7.605712890625, 8.12890625, 8.652099609375, 9.17529296875, 9.698486328125, 10.2216796875, 10.744873046875, 11.26806640625, 11.791259765625, 12.314453125, 12.837646484375, 13.36083984375, 13.884033203125, 14.4072265625, 14.930419921875, 15.45361328125, 15.976806640625, 16.5]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 14.0, 16.0, 15.0, 27.0, 24.0, 39.0, 47.0, 51.0, 64.0, 85.0, 118.0, 123.0, 131.0, 140.0, 171.0, 201.0, 198.0, 218.0, 205.0, 202.0, 205.0, 189.0, 178.0, 178.0, 175.0, 162.0, 134.0, 129.0, 110.0, 97.0, 95.0, 50.0, 50.0, 42.0, 30.0, 37.0, 25.0, 22.0, 17.0, 18.0, 7.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-6.72265625, -6.51177978515625, -6.3009033203125, -6.09002685546875, -5.879150390625, -5.66827392578125, -5.4573974609375, -5.24652099609375, -5.03564453125, -4.82476806640625, -4.6138916015625, -4.40301513671875, -4.192138671875, -3.98126220703125, -3.7703857421875, -3.55950927734375, -3.3486328125, -3.13775634765625, -2.9268798828125, -2.71600341796875, -2.505126953125, -2.29425048828125, -2.0833740234375, -1.87249755859375, -1.66162109375, -1.45074462890625, -1.2398681640625, -1.02899169921875, -0.818115234375, -0.60723876953125, -0.3963623046875, -0.18548583984375, 0.025390625, 0.23626708984375, 0.4471435546875, 0.65802001953125, 0.868896484375, 1.07977294921875, 1.2906494140625, 1.50152587890625, 1.71240234375, 1.92327880859375, 2.1341552734375, 2.34503173828125, 2.555908203125, 2.76678466796875, 2.9776611328125, 3.18853759765625, 3.3994140625, 3.61029052734375, 3.8211669921875, 4.03204345703125, 4.242919921875, 4.45379638671875, 4.6646728515625, 4.87554931640625, 5.08642578125, 5.29730224609375, 5.5081787109375, 5.71905517578125, 5.929931640625, 6.14080810546875, 6.3516845703125, 6.56256103515625, 6.7734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 9.0, 5.0, 12.0, 13.0, 14.0, 10.0, 18.0, 42.0, 28.0, 39.0, 33.0, 49.0, 54.0, 32.0, 33.0, 40.0, 46.0, 45.0, 61.0, 50.0, 49.0, 45.0, 29.0, 36.0, 30.0, 29.0, 31.0, 33.0, 11.0, 13.0, 13.0, 7.0, 5.0, 8.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.272865295410156, -16.7117977142334, -16.150728225708008, -15.589659690856934, -15.02859115600586, -14.467523574829102, -13.906455039978027, -13.345386505126953, -12.784317970275879, -12.223249435424805, -11.66218090057373, -11.101112365722656, -10.540044784545898, -9.978975296020508, -9.41790771484375, -8.856839179992676, -8.295770645141602, -7.734702110290527, -7.173633575439453, -6.612565517425537, -6.051496982574463, -5.490428447723389, -4.929360389709473, -4.368291854858398, -3.807223320007324, -3.24615478515625, -2.685086488723755, -2.1240181922912598, -1.5629496574401855, -1.0018811225891113, -0.4408128261566162, 0.1202554702758789, 0.6813240051269531, 1.2423924207687378, 1.8034608364105225, 2.3645291328430176, 2.925597667694092, 3.486666202545166, 4.047734260559082, 4.608802795410156, 5.1698713302612305, 5.730939865112305, 6.292008399963379, 6.853076457977295, 7.414144992828369, 7.975213527679443, 8.53628158569336, 9.097350120544434, 9.658418655395508, 10.219487190246582, 10.780555725097656, 11.34162425994873, 11.902692794799805, 12.463760375976562, 13.024828910827637, 13.585897445678711, 14.146965980529785, 14.70803451538086, 15.269103050231934, 15.830171585083008, 16.391239166259766, 16.952308654785156, 17.513376235961914, 18.074443817138672, 18.635513305664062]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 5.0, 4.0, 7.0, 11.0, 7.0, 11.0, 18.0, 18.0, 10.0, 26.0, 19.0, 28.0, 20.0, 27.0, 26.0, 35.0, 34.0, 20.0, 36.0, 33.0, 36.0, 42.0, 35.0, 40.0, 30.0, 50.0, 32.0, 35.0, 29.0, 33.0, 26.0, 25.0, 18.0, 18.0, 16.0, 18.0, 22.0, 19.0, 11.0, 8.0, 6.0, 7.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.895451545715332, -12.44568920135498, -11.995927810668945, -11.546165466308594, -11.096403121948242, -10.64664077758789, -10.196878433227539, -9.747117042541504, -9.297354698181152, -8.8475923538208, -8.397830963134766, -7.948068618774414, -7.4983062744140625, -7.048543930053711, -6.598782062530518, -6.149020195007324, -5.699257850646973, -5.249495506286621, -4.799733638763428, -4.349971771240234, -3.900209426879883, -3.4504473209381104, -3.000685214996338, -2.5509231090545654, -2.101161003112793, -1.6513988971710205, -1.201636791229248, -0.7518746852874756, -0.3021125793457031, 0.14764952659606934, 0.5974116325378418, 1.0471737384796143, 1.4969358444213867, 1.9466979503631592, 2.3964600563049316, 2.846222162246704, 3.2959842681884766, 3.745746374130249, 4.1955084800720215, 4.645270347595215, 5.095032691955566, 5.544795036315918, 5.994556903839111, 6.444318771362305, 6.894081115722656, 7.343843460083008, 7.793605327606201, 8.243367195129395, 8.693129539489746, 9.142891883850098, 9.592653274536133, 10.042415618896484, 10.492177963256836, 10.941940307617188, 11.391702651977539, 11.841464042663574, 12.291226387023926, 12.740988731384277, 13.190750122070312, 13.640512466430664, 14.090274810791016, 14.540037155151367, 14.989799499511719, 15.439560890197754, 15.889323234558105]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 20.0, 20.0, 39.0, 42.0, 47.0, 104.0, 141.0, 202.0, 272.0, 473.0, 793.0, 1179.0, 1807.0, 2805.0, 4568.0, 6996.0, 11248.0, 17756.0, 27522.0, 41374.0, 60863.0, 84767.0, 108599.0, 126322.0, 129429.0, 116986.0, 94449.0, 70153.0, 48982.0, 32575.0, 21302.0, 13339.0, 8534.0, 5392.0, 3432.0, 2138.0, 1334.0, 835.0, 592.0, 356.0, 280.0, 167.0, 101.0, 66.0, 64.0, 33.0, 19.0, 10.0, 7.0, 5.0, 8.0, 3.0, 5.0, 1.0, 2.0, 3.0], "bins": [-3.126953125, -3.02984619140625, -2.9327392578125, -2.83563232421875, -2.738525390625, -2.64141845703125, -2.5443115234375, -2.44720458984375, -2.35009765625, -2.25299072265625, -2.1558837890625, -2.05877685546875, -1.961669921875, -1.86456298828125, -1.7674560546875, -1.67034912109375, -1.5732421875, -1.47613525390625, -1.3790283203125, -1.28192138671875, -1.184814453125, -1.08770751953125, -0.9906005859375, -0.89349365234375, -0.79638671875, -0.69927978515625, -0.6021728515625, -0.50506591796875, -0.407958984375, -0.31085205078125, -0.2137451171875, -0.11663818359375, -0.01953125, 0.07757568359375, 0.1746826171875, 0.27178955078125, 0.368896484375, 0.46600341796875, 0.5631103515625, 0.66021728515625, 0.75732421875, 0.85443115234375, 0.9515380859375, 1.04864501953125, 1.145751953125, 1.24285888671875, 1.3399658203125, 1.43707275390625, 1.5341796875, 1.63128662109375, 1.7283935546875, 1.82550048828125, 1.922607421875, 2.01971435546875, 2.1168212890625, 2.21392822265625, 2.31103515625, 2.40814208984375, 2.5052490234375, 2.60235595703125, 2.699462890625, 2.79656982421875, 2.8936767578125, 2.99078369140625, 3.087890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 4.0, 7.0, 11.0, 7.0, 12.0, 15.0, 18.0, 13.0, 24.0, 20.0, 26.0, 21.0, 26.0, 28.0, 35.0, 33.0, 20.0, 36.0, 35.0, 34.0, 40.0, 39.0, 37.0, 30.0, 49.0, 32.0, 37.0, 28.0, 35.0, 24.0, 24.0, 19.0, 17.0, 19.0, 17.0, 21.0, 20.0, 11.0, 8.0, 6.0, 8.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.921875, -12.472412109375, -12.02294921875, -11.573486328125, -11.1240234375, -10.674560546875, -10.22509765625, -9.775634765625, -9.326171875, -8.876708984375, -8.42724609375, -7.977783203125, -7.5283203125, -7.078857421875, -6.62939453125, -6.179931640625, -5.73046875, -5.281005859375, -4.83154296875, -4.382080078125, -3.9326171875, -3.483154296875, -3.03369140625, -2.584228515625, -2.134765625, -1.685302734375, -1.23583984375, -0.786376953125, -0.3369140625, 0.112548828125, 0.56201171875, 1.011474609375, 1.4609375, 1.910400390625, 2.35986328125, 2.809326171875, 3.2587890625, 3.708251953125, 4.15771484375, 4.607177734375, 5.056640625, 5.506103515625, 5.95556640625, 6.405029296875, 6.8544921875, 7.303955078125, 7.75341796875, 8.202880859375, 8.65234375, 9.101806640625, 9.55126953125, 10.000732421875, 10.4501953125, 10.899658203125, 11.34912109375, 11.798583984375, 12.248046875, 12.697509765625, 13.14697265625, 13.596435546875, 14.0458984375, 14.495361328125, 14.94482421875, 15.394287109375, 15.84375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 8.0, 13.0, 18.0, 27.0, 37.0, 38.0, 69.0, 77.0, 101.0, 141.0, 208.0, 261.0, 377.0, 528.0, 799.0, 1078.0, 1580.0, 2416.0, 3655.0, 5650.0, 8871.0, 14135.0, 24272.0, 75351.0, 796897.0, 52675.0, 22014.0, 13097.0, 8026.0, 5399.0, 3418.0, 2207.0, 1511.0, 1009.0, 748.0, 543.0, 369.0, 251.0, 186.0, 106.0, 107.0, 67.0, 52.0, 47.0, 26.0, 18.0, 11.0, 9.0, 10.0, 11.0, 3.0, 3.0, 4.0, 0.0, 7.0], "bins": [-7.92578125, -7.68865966796875, -7.4515380859375, -7.21441650390625, -6.977294921875, -6.74017333984375, -6.5030517578125, -6.26593017578125, -6.02880859375, -5.79168701171875, -5.5545654296875, -5.31744384765625, -5.080322265625, -4.84320068359375, -4.6060791015625, -4.36895751953125, -4.1318359375, -3.89471435546875, -3.6575927734375, -3.42047119140625, -3.183349609375, -2.94622802734375, -2.7091064453125, -2.47198486328125, -2.23486328125, -1.99774169921875, -1.7606201171875, -1.52349853515625, -1.286376953125, -1.04925537109375, -0.8121337890625, -0.57501220703125, -0.337890625, -0.10076904296875, 0.1363525390625, 0.37347412109375, 0.610595703125, 0.84771728515625, 1.0848388671875, 1.32196044921875, 1.55908203125, 1.79620361328125, 2.0333251953125, 2.27044677734375, 2.507568359375, 2.74468994140625, 2.9818115234375, 3.21893310546875, 3.4560546875, 3.69317626953125, 3.9302978515625, 4.16741943359375, 4.404541015625, 4.64166259765625, 4.8787841796875, 5.11590576171875, 5.35302734375, 5.59014892578125, 5.8272705078125, 6.06439208984375, 6.301513671875, 6.53863525390625, 6.7757568359375, 7.01287841796875, 7.25]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 11.0, 10.0, 6.0, 7.0, 13.0, 16.0, 16.0, 16.0, 20.0, 11.0, 24.0, 30.0, 30.0, 22.0, 32.0, 38.0, 39.0, 33.0, 38.0, 40.0, 36.0, 37.0, 31.0, 44.0, 36.0, 30.0, 29.0, 39.0, 30.0, 23.0, 31.0, 29.0, 29.0, 23.0, 18.0, 5.0, 18.0, 8.0, 10.0, 14.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.7265625, -9.4117431640625, -9.096923828125, -8.7821044921875, -8.46728515625, -8.1524658203125, -7.837646484375, -7.5228271484375, -7.2080078125, -6.8931884765625, -6.578369140625, -6.2635498046875, -5.94873046875, -5.6339111328125, -5.319091796875, -5.0042724609375, -4.689453125, -4.3746337890625, -4.059814453125, -3.7449951171875, -3.43017578125, -3.1153564453125, -2.800537109375, -2.4857177734375, -2.1708984375, -1.8560791015625, -1.541259765625, -1.2264404296875, -0.91162109375, -0.5968017578125, -0.281982421875, 0.0328369140625, 0.34765625, 0.6624755859375, 0.977294921875, 1.2921142578125, 1.60693359375, 1.9217529296875, 2.236572265625, 2.5513916015625, 2.8662109375, 3.1810302734375, 3.495849609375, 3.8106689453125, 4.12548828125, 4.4403076171875, 4.755126953125, 5.0699462890625, 5.384765625, 5.6995849609375, 6.014404296875, 6.3292236328125, 6.64404296875, 6.9588623046875, 7.273681640625, 7.5885009765625, 7.9033203125, 8.2181396484375, 8.532958984375, 8.8477783203125, 9.16259765625, 9.4774169921875, 9.792236328125, 10.1070556640625, 10.421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 4.0, 5.0, 6.0, 6.0, 11.0, 11.0, 11.0, 17.0, 35.0, 30.0, 59.0, 78.0, 124.0, 170.0, 319.0, 465.0, 937.0, 1696.0, 3268.0, 6606.0, 14242.0, 31773.0, 649725.0, 285342.0, 28345.0, 12666.0, 6079.0, 2882.0, 1545.0, 833.0, 458.0, 258.0, 188.0, 99.0, 82.0, 58.0, 36.0, 26.0, 14.0, 12.0, 6.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92578125, -0.89678955078125, -0.8677978515625, -0.83880615234375, -0.809814453125, -0.78082275390625, -0.7518310546875, -0.72283935546875, -0.69384765625, -0.66485595703125, -0.6358642578125, -0.60687255859375, -0.577880859375, -0.54888916015625, -0.5198974609375, -0.49090576171875, -0.4619140625, -0.43292236328125, -0.4039306640625, -0.37493896484375, -0.345947265625, -0.31695556640625, -0.2879638671875, -0.25897216796875, -0.22998046875, -0.20098876953125, -0.1719970703125, -0.14300537109375, -0.114013671875, -0.08502197265625, -0.0560302734375, -0.02703857421875, 0.001953125, 0.03094482421875, 0.0599365234375, 0.08892822265625, 0.117919921875, 0.14691162109375, 0.1759033203125, 0.20489501953125, 0.23388671875, 0.26287841796875, 0.2918701171875, 0.32086181640625, 0.349853515625, 0.37884521484375, 0.4078369140625, 0.43682861328125, 0.4658203125, 0.49481201171875, 0.5238037109375, 0.55279541015625, 0.581787109375, 0.61077880859375, 0.6397705078125, 0.66876220703125, 0.69775390625, 0.72674560546875, 0.7557373046875, 0.78472900390625, 0.813720703125, 0.84271240234375, 0.8717041015625, 0.90069580078125, 0.9296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 10.0, 4.0, 10.0, 13.0, 7.0, 9.0, 19.0, 25.0, 26.0, 28.0, 28.0, 28.0, 34.0, 33.0, 50.0, 58.0, 61.0, 51.0, 45.0, 50.0, 48.0, 53.0, 51.0, 50.0, 44.0, 33.0, 22.0, 9.0, 17.0, 24.0, 13.0, 12.0, 9.0, 3.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8848648071289062e-05, -2.7942471206188202e-05, -2.703629434108734e-05, -2.613011747598648e-05, -2.522394061088562e-05, -2.431776374578476e-05, -2.34115868806839e-05, -2.250541001558304e-05, -2.1599233150482178e-05, -2.0693056285381317e-05, -1.9786879420280457e-05, -1.8880702555179596e-05, -1.7974525690078735e-05, -1.7068348824977875e-05, -1.6162171959877014e-05, -1.5255995094776154e-05, -1.4349818229675293e-05, -1.3443641364574432e-05, -1.2537464499473572e-05, -1.1631287634372711e-05, -1.072511076927185e-05, -9.81893390417099e-06, -8.91275703907013e-06, -8.006580173969269e-06, -7.100403308868408e-06, -6.194226443767548e-06, -5.288049578666687e-06, -4.381872713565826e-06, -3.475695848464966e-06, -2.5695189833641052e-06, -1.6633421182632446e-06, -7.57165253162384e-07, 1.4901161193847656e-07, 1.0551884770393372e-06, 1.9613653421401978e-06, 2.8675422072410583e-06, 3.773719072341919e-06, 4.6798959374427795e-06, 5.58607280254364e-06, 6.492249667644501e-06, 7.398426532745361e-06, 8.304603397846222e-06, 9.210780262947083e-06, 1.0116957128047943e-05, 1.1023133993148804e-05, 1.1929310858249664e-05, 1.2835487723350525e-05, 1.3741664588451385e-05, 1.4647841453552246e-05, 1.5554018318653107e-05, 1.6460195183753967e-05, 1.7366372048854828e-05, 1.827254891395569e-05, 1.917872577905655e-05, 2.008490264415741e-05, 2.099107950925827e-05, 2.189725637435913e-05, 2.280343323945999e-05, 2.3709610104560852e-05, 2.4615786969661713e-05, 2.5521963834762573e-05, 2.6428140699863434e-05, 2.7334317564964294e-05, 2.8240494430065155e-05, 2.9146671295166016e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 13.0, 13.0, 22.0, 25.0, 53.0, 80.0, 137.0, 198.0, 290.0, 468.0, 790.0, 1369.0, 2345.0, 4294.0, 7787.0, 14303.0, 25426.0, 44379.0, 74290.0, 114112.0, 158934.0, 178150.0, 151468.0, 107899.0, 68614.0, 40947.0, 23310.0, 12769.0, 6855.0, 3878.0, 2176.0, 1242.0, 687.0, 407.0, 286.0, 173.0, 127.0, 79.0, 52.0, 31.0, 19.0, 19.0, 9.0, 7.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8173828125, -0.7913665771484375, -0.765350341796875, -0.7393341064453125, -0.71331787109375, -0.6873016357421875, -0.661285400390625, -0.6352691650390625, -0.6092529296875, -0.5832366943359375, -0.557220458984375, -0.5312042236328125, -0.50518798828125, -0.4791717529296875, -0.453155517578125, -0.4271392822265625, -0.401123046875, -0.3751068115234375, -0.349090576171875, -0.3230743408203125, -0.29705810546875, -0.2710418701171875, -0.245025634765625, -0.2190093994140625, -0.1929931640625, -0.1669769287109375, -0.140960693359375, -0.1149444580078125, -0.08892822265625, -0.0629119873046875, -0.036895751953125, -0.0108795166015625, 0.01513671875, 0.0411529541015625, 0.067169189453125, 0.0931854248046875, 0.11920166015625, 0.1452178955078125, 0.171234130859375, 0.1972503662109375, 0.2232666015625, 0.2492828369140625, 0.275299072265625, 0.3013153076171875, 0.32733154296875, 0.3533477783203125, 0.379364013671875, 0.4053802490234375, 0.431396484375, 0.4574127197265625, 0.483428955078125, 0.5094451904296875, 0.53546142578125, 0.5614776611328125, 0.587493896484375, 0.6135101318359375, 0.6395263671875, 0.6655426025390625, 0.691558837890625, 0.7175750732421875, 0.74359130859375, 0.7696075439453125, 0.795623779296875, 0.8216400146484375, 0.84765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 7.0, 13.0, 19.0, 21.0, 30.0, 40.0, 37.0, 48.0, 69.0, 81.0, 67.0, 67.0, 81.0, 87.0, 65.0, 60.0, 44.0, 25.0, 26.0, 22.0, 13.0, 16.0, 16.0, 3.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3221244812011719, -0.31075286865234375, -0.2993812561035156, -0.2880096435546875, -0.2766380310058594, -0.26526641845703125, -0.2538948059082031, -0.242523193359375, -0.23115158081054688, -0.21977996826171875, -0.20840835571289062, -0.1970367431640625, -0.18566513061523438, -0.17429351806640625, -0.16292190551757812, -0.15155029296875, -0.14017868041992188, -0.12880706787109375, -0.11743545532226562, -0.1060638427734375, -0.09469223022460938, -0.08332061767578125, -0.07194900512695312, -0.060577392578125, -0.049205780029296875, -0.03783416748046875, -0.026462554931640625, -0.0150909423828125, -0.003719329833984375, 0.00765228271484375, 0.019023895263671875, 0.0303955078125, 0.041767120361328125, 0.05313873291015625, 0.06451034545898438, 0.0758819580078125, 0.08725357055664062, 0.09862518310546875, 0.10999679565429688, 0.121368408203125, 0.13274002075195312, 0.14411163330078125, 0.15548324584960938, 0.1668548583984375, 0.17822647094726562, 0.18959808349609375, 0.20096969604492188, 0.21234130859375, 0.22371292114257812, 0.23508453369140625, 0.24645614624023438, 0.2578277587890625, 0.2691993713378906, 0.28057098388671875, 0.2919425964355469, 0.303314208984375, 0.3146858215332031, 0.32605743408203125, 0.3374290466308594, 0.3488006591796875, 0.3601722717285156, 0.37154388427734375, 0.3829154968261719, 0.394287109375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 6.0, 9.0, 11.0, 11.0, 13.0, 14.0, 19.0, 37.0, 28.0, 31.0, 54.0, 41.0, 48.0, 31.0, 48.0, 23.0, 57.0, 40.0, 58.0, 58.0, 40.0, 47.0, 31.0, 37.0, 34.0, 29.0, 29.0, 35.0, 6.0, 14.0, 12.0, 8.0, 7.0, 4.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.43577003479004, -16.86945343017578, -16.303136825561523, -15.736820220947266, -15.170504570007324, -14.604187965393066, -14.037871360778809, -13.47155475616455, -12.90523910522461, -12.338922500610352, -11.772605895996094, -11.206289291381836, -10.639973640441895, -10.073657035827637, -9.507340431213379, -8.941023826599121, -8.374707221984863, -7.8083906173706055, -7.242074489593506, -6.675757884979248, -6.109441757202148, -5.543125152587891, -4.976808547973633, -4.410491943359375, -3.8441758155822754, -3.2778594493865967, -2.711543083190918, -2.14522647857666, -1.5789101123809814, -1.0125937461853027, -0.4462771415710449, 0.12003922462463379, 0.6863555908203125, 1.2526719570159912, 1.8189884424209595, 2.3853049278259277, 2.9516212940216064, 3.517937660217285, 4.084254264831543, 4.650570869445801, 5.2168869972229, 5.783203601837158, 6.349519729614258, 6.915836334228516, 7.482152938842773, 8.048469543457031, 8.614786148071289, 9.18110179901123, 9.747418403625488, 10.313735008239746, 10.880051612854004, 11.446367263793945, 12.012683868408203, 12.579000473022461, 13.145317077636719, 13.711633682250977, 14.277950286865234, 14.844266891479492, 15.41058349609375, 15.976900100708008, 16.543216705322266, 17.10953140258789, 17.67584991455078, 18.242164611816406, 18.808481216430664]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 7.0, 1.0, 7.0, 4.0, 6.0, 12.0, 6.0, 12.0, 14.0, 18.0, 15.0, 23.0, 20.0, 25.0, 20.0, 30.0, 18.0, 42.0, 30.0, 23.0, 37.0, 30.0, 37.0, 38.0, 40.0, 36.0, 30.0, 52.0, 33.0, 32.0, 32.0, 35.0, 24.0, 24.0, 21.0, 16.0, 15.0, 19.0, 24.0, 18.0, 9.0, 11.0, 4.0, 10.0, 12.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.966719627380371, -12.517382621765137, -12.068044662475586, -11.618707656860352, -11.169370651245117, -10.720033645629883, -10.270696640014648, -9.821358680725098, -9.372021675109863, -8.922684669494629, -8.473346710205078, -8.024009704589844, -7.574672698974609, -7.125335693359375, -6.675998210906982, -6.22666072845459, -5.7773237228393555, -5.327986717224121, -4.8786492347717285, -4.429311752319336, -3.9799747467041016, -3.530637502670288, -3.0813002586364746, -2.631963014602661, -2.1826257705688477, -1.7332885265350342, -1.2839512825012207, -0.8346140384674072, -0.38527679443359375, 0.06406044960021973, 0.5133976936340332, 0.9627349376678467, 1.4120721817016602, 1.8614094257354736, 2.310746669769287, 2.7600839138031006, 3.209421157836914, 3.6587584018707275, 4.108095645904541, 4.557433128356934, 5.006770133972168, 5.456107139587402, 5.905444622039795, 6.3547821044921875, 6.804119110107422, 7.253456115722656, 7.702793598175049, 8.152131080627441, 8.601468086242676, 9.05080509185791, 9.500143051147461, 9.949480056762695, 10.39881706237793, 10.848154067993164, 11.297491073608398, 11.74682903289795, 12.196166038513184, 12.645503044128418, 13.094841003417969, 13.544178009033203, 13.993515014648438, 14.442852020263672, 14.892189025878906, 15.341526985168457, 15.790863990783691]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 13.0, 14.0, 30.0, 39.0, 84.0, 140.0, 222.0, 441.0, 694.0, 1257.0, 2112.0, 3710.0, 5866.0, 9932.0, 15417.0, 23597.0, 35346.0, 50398.0, 68237.0, 86342.0, 102140.0, 111947.0, 112435.0, 103581.0, 87848.0, 70310.0, 52516.0, 36759.0, 25149.0, 16151.0, 10188.0, 6207.0, 3880.0, 2285.0, 1383.0, 828.0, 464.0, 268.0, 146.0, 79.0, 42.0, 25.0, 16.0, 10.0, 8.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.037353515625, -10.61376953125, -10.190185546875, -9.7666015625, -9.343017578125, -8.91943359375, -8.495849609375, -8.072265625, -7.648681640625, -7.22509765625, -6.801513671875, -6.3779296875, -5.954345703125, -5.53076171875, -5.107177734375, -4.68359375, -4.260009765625, -3.83642578125, -3.412841796875, -2.9892578125, -2.565673828125, -2.14208984375, -1.718505859375, -1.294921875, -0.871337890625, -0.44775390625, -0.024169921875, 0.3994140625, 0.822998046875, 1.24658203125, 1.670166015625, 2.09375, 2.517333984375, 2.94091796875, 3.364501953125, 3.7880859375, 4.211669921875, 4.63525390625, 5.058837890625, 5.482421875, 5.906005859375, 6.32958984375, 6.753173828125, 7.1767578125, 7.600341796875, 8.02392578125, 8.447509765625, 8.87109375, 9.294677734375, 9.71826171875, 10.141845703125, 10.5654296875, 10.989013671875, 11.41259765625, 11.836181640625, 12.259765625, 12.683349609375, 13.10693359375, 13.530517578125, 13.9541015625, 14.377685546875, 14.80126953125, 15.224853515625, 15.6484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 7.0, 2.0, 7.0, 5.0, 6.0, 10.0, 7.0, 8.0, 17.0, 18.0, 13.0, 28.0, 21.0, 20.0, 26.0, 24.0, 25.0, 35.0, 33.0, 24.0, 32.0, 35.0, 41.0, 30.0, 46.0, 35.0, 26.0, 50.0, 36.0, 38.0, 27.0, 35.0, 25.0, 23.0, 21.0, 19.0, 15.0, 22.0, 18.0, 16.0, 14.0, 7.0, 5.0, 9.0, 13.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.5625, -12.12646484375, -11.6904296875, -11.25439453125, -10.818359375, -10.38232421875, -9.9462890625, -9.51025390625, -9.07421875, -8.63818359375, -8.2021484375, -7.76611328125, -7.330078125, -6.89404296875, -6.4580078125, -6.02197265625, -5.5859375, -5.14990234375, -4.7138671875, -4.27783203125, -3.841796875, -3.40576171875, -2.9697265625, -2.53369140625, -2.09765625, -1.66162109375, -1.2255859375, -0.78955078125, -0.353515625, 0.08251953125, 0.5185546875, 0.95458984375, 1.390625, 1.82666015625, 2.2626953125, 2.69873046875, 3.134765625, 3.57080078125, 4.0068359375, 4.44287109375, 4.87890625, 5.31494140625, 5.7509765625, 6.18701171875, 6.623046875, 7.05908203125, 7.4951171875, 7.93115234375, 8.3671875, 8.80322265625, 9.2392578125, 9.67529296875, 10.111328125, 10.54736328125, 10.9833984375, 11.41943359375, 11.85546875, 12.29150390625, 12.7275390625, 13.16357421875, 13.599609375, 14.03564453125, 14.4716796875, 14.90771484375, 15.34375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 9.0, 6.0, 23.0, 25.0, 59.0, 79.0, 122.0, 216.0, 383.0, 581.0, 958.0, 1620.0, 2634.0, 4199.0, 6698.0, 10386.0, 16240.0, 24094.0, 34953.0, 48621.0, 64618.0, 81174.0, 96415.0, 106064.0, 108045.0, 101008.0, 88555.0, 72074.0, 56058.0, 40036.0, 28694.0, 19495.0, 12751.0, 8188.0, 5134.0, 3226.0, 1961.0, 1225.0, 745.0, 449.0, 293.0, 165.0, 101.0, 75.0, 44.0, 29.0, 12.0, 12.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.3515625, -12.96142578125, -12.5712890625, -12.18115234375, -11.791015625, -11.40087890625, -11.0107421875, -10.62060546875, -10.23046875, -9.84033203125, -9.4501953125, -9.06005859375, -8.669921875, -8.27978515625, -7.8896484375, -7.49951171875, -7.109375, -6.71923828125, -6.3291015625, -5.93896484375, -5.548828125, -5.15869140625, -4.7685546875, -4.37841796875, -3.98828125, -3.59814453125, -3.2080078125, -2.81787109375, -2.427734375, -2.03759765625, -1.6474609375, -1.25732421875, -0.8671875, -0.47705078125, -0.0869140625, 0.30322265625, 0.693359375, 1.08349609375, 1.4736328125, 1.86376953125, 2.25390625, 2.64404296875, 3.0341796875, 3.42431640625, 3.814453125, 4.20458984375, 4.5947265625, 4.98486328125, 5.375, 5.76513671875, 6.1552734375, 6.54541015625, 6.935546875, 7.32568359375, 7.7158203125, 8.10595703125, 8.49609375, 8.88623046875, 9.2763671875, 9.66650390625, 10.056640625, 10.44677734375, 10.8369140625, 11.22705078125, 11.6171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 10.0, 10.0, 4.0, 9.0, 13.0, 15.0, 23.0, 27.0, 27.0, 15.0, 17.0, 22.0, 27.0, 26.0, 33.0, 35.0, 35.0, 42.0, 44.0, 31.0, 40.0, 26.0, 37.0, 31.0, 39.0, 41.0, 39.0, 18.0, 34.0, 32.0, 27.0, 27.0, 20.0, 15.0, 10.0, 15.0, 18.0, 15.0, 5.0, 11.0, 6.0, 7.0, 6.0, 3.0, 0.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.6953125, -9.3974609375, -9.099609375, -8.8017578125, -8.50390625, -8.2060546875, -7.908203125, -7.6103515625, -7.3125, -7.0146484375, -6.716796875, -6.4189453125, -6.12109375, -5.8232421875, -5.525390625, -5.2275390625, -4.9296875, -4.6318359375, -4.333984375, -4.0361328125, -3.73828125, -3.4404296875, -3.142578125, -2.8447265625, -2.546875, -2.2490234375, -1.951171875, -1.6533203125, -1.35546875, -1.0576171875, -0.759765625, -0.4619140625, -0.1640625, 0.1337890625, 0.431640625, 0.7294921875, 1.02734375, 1.3251953125, 1.623046875, 1.9208984375, 2.21875, 2.5166015625, 2.814453125, 3.1123046875, 3.41015625, 3.7080078125, 4.005859375, 4.3037109375, 4.6015625, 4.8994140625, 5.197265625, 5.4951171875, 5.79296875, 6.0908203125, 6.388671875, 6.6865234375, 6.984375, 7.2822265625, 7.580078125, 7.8779296875, 8.17578125, 8.4736328125, 8.771484375, 9.0693359375, 9.3671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 10.0, 15.0, 19.0, 35.0, 36.0, 84.0, 117.0, 222.0, 303.0, 510.0, 752.0, 1215.0, 1950.0, 2971.0, 4783.0, 7760.0, 12449.0, 20273.0, 32526.0, 50170.0, 72743.0, 99217.0, 122318.0, 133157.0, 128601.0, 109842.0, 83732.0, 58756.0, 38612.0, 24521.0, 15477.0, 9633.0, 5785.0, 3596.0, 2384.0, 1443.0, 902.0, 565.0, 371.0, 220.0, 185.0, 120.0, 60.0, 40.0, 32.0, 14.0, 12.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.60430908203125, -5.4156494140625, -5.22698974609375, -5.038330078125, -4.84967041015625, -4.6610107421875, -4.47235107421875, -4.28369140625, -4.09503173828125, -3.9063720703125, -3.71771240234375, -3.529052734375, -3.34039306640625, -3.1517333984375, -2.96307373046875, -2.7744140625, -2.58575439453125, -2.3970947265625, -2.20843505859375, -2.019775390625, -1.83111572265625, -1.6424560546875, -1.45379638671875, -1.26513671875, -1.07647705078125, -0.8878173828125, -0.69915771484375, -0.510498046875, -0.32183837890625, -0.1331787109375, 0.05548095703125, 0.244140625, 0.43280029296875, 0.6214599609375, 0.81011962890625, 0.998779296875, 1.18743896484375, 1.3760986328125, 1.56475830078125, 1.75341796875, 1.94207763671875, 2.1307373046875, 2.31939697265625, 2.508056640625, 2.69671630859375, 2.8853759765625, 3.07403564453125, 3.2626953125, 3.45135498046875, 3.6400146484375, 3.82867431640625, 4.017333984375, 4.20599365234375, 4.3946533203125, 4.58331298828125, 4.77197265625, 4.96063232421875, 5.1492919921875, 5.33795166015625, 5.526611328125, 5.71527099609375, 5.9039306640625, 6.09259033203125, 6.28125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 7.0, 5.0, 8.0, 15.0, 16.0, 25.0, 16.0, 15.0, 28.0, 28.0, 29.0, 42.0, 43.0, 49.0, 44.0, 64.0, 42.0, 44.0, 50.0, 44.0, 39.0, 38.0, 43.0, 35.0, 31.0, 33.0, 28.0, 21.0, 10.0, 14.0, 11.0, 14.0, 9.0, 12.0, 7.0, 4.0, 5.0, 3.0, 2.0, 5.0, 6.0, 2.0, 2.0], "bins": [-0.0007410049438476562, -0.0007216185331344604, -0.0007022321224212646, -0.0006828457117080688, -0.000663459300994873, -0.0006440728902816772, -0.0006246864795684814, -0.0006053000688552856, -0.0005859136581420898, -0.000566527247428894, -0.0005471408367156982, -0.0005277544260025024, -0.0005083680152893066, -0.0004889816045761108, -0.00046959519386291504, -0.00045020878314971924, -0.00043082237243652344, -0.00041143596172332764, -0.00039204955101013184, -0.00037266314029693604, -0.00035327672958374023, -0.00033389031887054443, -0.00031450390815734863, -0.00029511749744415283, -0.00027573108673095703, -0.00025634467601776123, -0.00023695826530456543, -0.00021757185459136963, -0.00019818544387817383, -0.00017879903316497803, -0.00015941262245178223, -0.00014002621173858643, -0.00012063980102539062, -0.00010125339031219482, -8.186697959899902e-05, -6.248056888580322e-05, -4.309415817260742e-05, -2.370774745941162e-05, -4.32133674621582e-06, 1.506507396697998e-05, 3.445148468017578e-05, 5.383789539337158e-05, 7.322430610656738e-05, 9.261071681976318e-05, 0.00011199712753295898, 0.00013138353824615479, 0.00015076994895935059, 0.0001701563596725464, 0.0001895427703857422, 0.000208929181098938, 0.0002283155918121338, 0.0002477020025253296, 0.0002670884132385254, 0.0002864748239517212, 0.000305861234664917, 0.0003252476453781128, 0.0003446340560913086, 0.0003640204668045044, 0.0003834068775177002, 0.000402793288230896, 0.0004221796989440918, 0.0004415661096572876, 0.0004609525203704834, 0.0004803389310836792, 0.000499725341796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 16.0, 17.0, 37.0, 48.0, 84.0, 88.0, 170.0, 245.0, 421.0, 666.0, 1055.0, 1701.0, 2998.0, 5193.0, 8881.0, 15601.0, 27600.0, 47137.0, 77124.0, 115317.0, 149204.0, 161505.0, 146099.0, 110049.0, 72667.0, 44107.0, 25699.0, 14729.0, 8260.0, 4767.0, 2757.0, 1599.0, 1048.0, 581.0, 365.0, 250.0, 159.0, 118.0, 55.0, 36.0, 26.0, 28.0, 16.0, 12.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-9.125, -8.86749267578125, -8.6099853515625, -8.35247802734375, -8.094970703125, -7.83746337890625, -7.5799560546875, -7.32244873046875, -7.06494140625, -6.80743408203125, -6.5499267578125, -6.29241943359375, -6.034912109375, -5.77740478515625, -5.5198974609375, -5.26239013671875, -5.0048828125, -4.74737548828125, -4.4898681640625, -4.23236083984375, -3.974853515625, -3.71734619140625, -3.4598388671875, -3.20233154296875, -2.94482421875, -2.68731689453125, -2.4298095703125, -2.17230224609375, -1.914794921875, -1.65728759765625, -1.3997802734375, -1.14227294921875, -0.884765625, -0.62725830078125, -0.3697509765625, -0.11224365234375, 0.145263671875, 0.40277099609375, 0.6602783203125, 0.91778564453125, 1.17529296875, 1.43280029296875, 1.6903076171875, 1.94781494140625, 2.205322265625, 2.46282958984375, 2.7203369140625, 2.97784423828125, 3.2353515625, 3.49285888671875, 3.7503662109375, 4.00787353515625, 4.265380859375, 4.52288818359375, 4.7803955078125, 5.03790283203125, 5.29541015625, 5.55291748046875, 5.8104248046875, 6.06793212890625, 6.325439453125, 6.58294677734375, 6.8404541015625, 7.09796142578125, 7.35546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 7.0, 7.0, 6.0, 6.0, 13.0, 14.0, 23.0, 19.0, 26.0, 18.0, 36.0, 39.0, 42.0, 39.0, 53.0, 48.0, 48.0, 41.0, 50.0, 64.0, 46.0, 45.0, 47.0, 39.0, 35.0, 29.0, 29.0, 21.0, 16.0, 15.0, 9.0, 13.0, 7.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-2.8828125, -2.7989501953125, -2.715087890625, -2.6312255859375, -2.54736328125, -2.4635009765625, -2.379638671875, -2.2957763671875, -2.2119140625, -2.1280517578125, -2.044189453125, -1.9603271484375, -1.87646484375, -1.7926025390625, -1.708740234375, -1.6248779296875, -1.541015625, -1.4571533203125, -1.373291015625, -1.2894287109375, -1.20556640625, -1.1217041015625, -1.037841796875, -0.9539794921875, -0.8701171875, -0.7862548828125, -0.702392578125, -0.6185302734375, -0.53466796875, -0.4508056640625, -0.366943359375, -0.2830810546875, -0.19921875, -0.1153564453125, -0.031494140625, 0.0523681640625, 0.13623046875, 0.2200927734375, 0.303955078125, 0.3878173828125, 0.4716796875, 0.5555419921875, 0.639404296875, 0.7232666015625, 0.80712890625, 0.8909912109375, 0.974853515625, 1.0587158203125, 1.142578125, 1.2264404296875, 1.310302734375, 1.3941650390625, 1.47802734375, 1.5618896484375, 1.645751953125, 1.7296142578125, 1.8134765625, 1.8973388671875, 1.981201171875, 2.0650634765625, 2.14892578125, 2.2327880859375, 2.316650390625, 2.4005126953125, 2.484375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 7.0, 4.0, 8.0, 13.0, 13.0, 11.0, 24.0, 13.0, 35.0, 28.0, 29.0, 42.0, 39.0, 41.0, 37.0, 56.0, 40.0, 42.0, 35.0, 47.0, 54.0, 44.0, 44.0, 43.0, 35.0, 35.0, 28.0, 32.0, 22.0, 18.0, 14.0, 16.0, 9.0, 3.0, 8.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.99200439453125, -17.451509475708008, -16.911012649536133, -16.37051773071289, -15.830022811889648, -15.28952693939209, -14.749031066894531, -14.208536148071289, -13.668041229248047, -13.127545356750488, -12.587050437927246, -12.046554565429688, -11.506059646606445, -10.965563774108887, -10.425067901611328, -9.884572982788086, -9.344077110290527, -8.803581237792969, -8.263086318969727, -7.722590446472168, -7.182095527648926, -6.641599655151367, -6.101104259490967, -5.560608863830566, -5.020113468170166, -4.479618072509766, -3.9391226768493652, -3.3986270427703857, -2.8581316471099854, -2.317636251449585, -1.7771406173706055, -1.236645221710205, -0.6961498260498047, -0.15565437078475952, 0.38484108448028564, 0.9253365993499756, 1.465831995010376, 2.0063273906707764, 2.546823024749756, 3.0873184204101562, 3.6278138160705566, 4.168309211730957, 4.708804607391357, 5.249300003051758, 5.789795875549316, 6.330290794372559, 6.870786666870117, 7.411282062530518, 7.951777458190918, 8.492273330688477, 9.032768249511719, 9.573264122009277, 10.11375904083252, 10.654254913330078, 11.19474983215332, 11.735245704650879, 12.275741577148438, 12.816237449645996, 13.356732368469238, 13.897228240966797, 14.437723159790039, 14.978219032287598, 15.518714904785156, 16.0592098236084, 16.59970474243164]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 1.0, 4.0, 8.0, 9.0, 10.0, 27.0, 19.0, 18.0, 27.0, 25.0, 24.0, 26.0, 34.0, 31.0, 34.0, 38.0, 49.0, 40.0, 32.0, 38.0, 44.0, 32.0, 43.0, 35.0, 39.0, 35.0, 26.0, 34.0, 31.0, 26.0, 18.0, 16.0, 23.0, 12.0, 11.0, 10.0, 9.0, 9.0, 10.0, 6.0, 11.0, 4.0, 1.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-15.185629844665527, -14.681742668151855, -14.177855491638184, -13.673968315124512, -13.17008113861084, -12.666193962097168, -12.162307739257812, -11.65842056274414, -11.154533386230469, -10.650646209716797, -10.146759033203125, -9.642871856689453, -9.138984680175781, -8.63509750366211, -8.131210327148438, -7.627323627471924, -7.123435974121094, -6.619548797607422, -6.11566162109375, -5.611774444580078, -5.107887268066406, -4.604000091552734, -4.100113391876221, -3.596226215362549, -3.092339038848877, -2.588451862335205, -2.084564685821533, -1.5806777477264404, -1.0767905712127686, -0.5729033946990967, -0.0690164566040039, 0.43487071990966797, 0.9387569427490234, 1.4426441192626953, 1.9465311765670776, 2.45041823387146, 2.954305410385132, 3.4581925868988037, 3.9620795249938965, 4.465966701507568, 4.96985387802124, 5.473741054534912, 5.977628231048584, 6.481514930725098, 6.9854021072387695, 7.489289283752441, 7.993176460266113, 8.497063636779785, 9.000950813293457, 9.504837989807129, 10.0087251663208, 10.512612342834473, 11.016499519348145, 11.520386695861816, 12.024272918701172, 12.528160095214844, 13.032047271728516, 13.535934448242188, 14.03982162475586, 14.543708801269531, 15.047595977783203, 15.551483154296875, 16.055370330810547, 16.55925750732422, 17.06314468383789]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 8.0, 8.0, 13.0, 10.0, 27.0, 37.0, 51.0, 95.0, 156.0, 234.0, 367.0, 588.0, 931.0, 1442.0, 2391.0, 4084.0, 6710.0, 11268.0, 19001.0, 32608.0, 55283.0, 92105.0, 152198.0, 238977.0, 353704.0, 473272.0, 559128.0, 570703.0, 503368.0, 390835.0, 272728.0, 177345.0, 109290.0, 66122.0, 39295.0, 23622.0, 14007.0, 8513.0, 5232.0, 3135.0, 1921.0, 1251.0, 795.0, 500.0, 335.0, 200.0, 132.0, 86.0, 61.0, 40.0, 28.0, 19.0, 10.0, 7.0, 6.0, 6.0, 2.0, 0.0, 3.0, 0.0, 4.0], "bins": [-14.7578125, -14.2686767578125, -13.779541015625, -13.2904052734375, -12.80126953125, -12.3121337890625, -11.822998046875, -11.3338623046875, -10.8447265625, -10.3555908203125, -9.866455078125, -9.3773193359375, -8.88818359375, -8.3990478515625, -7.909912109375, -7.4207763671875, -6.931640625, -6.4425048828125, -5.953369140625, -5.4642333984375, -4.97509765625, -4.4859619140625, -3.996826171875, -3.5076904296875, -3.0185546875, -2.5294189453125, -2.040283203125, -1.5511474609375, -1.06201171875, -0.5728759765625, -0.083740234375, 0.4053955078125, 0.89453125, 1.3836669921875, 1.872802734375, 2.3619384765625, 2.85107421875, 3.3402099609375, 3.829345703125, 4.3184814453125, 4.8076171875, 5.2967529296875, 5.785888671875, 6.2750244140625, 6.76416015625, 7.2532958984375, 7.742431640625, 8.2315673828125, 8.720703125, 9.2098388671875, 9.698974609375, 10.1881103515625, 10.67724609375, 11.1663818359375, 11.655517578125, 12.1446533203125, 12.6337890625, 13.1229248046875, 13.612060546875, 14.1011962890625, 14.59033203125, 15.0794677734375, 15.568603515625, 16.0577392578125, 16.546875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 7.0, 5.0, 2.0, 3.0, 5.0, 11.0, 7.0, 19.0, 20.0, 24.0, 17.0, 26.0, 24.0, 22.0, 36.0, 30.0, 28.0, 40.0, 42.0, 43.0, 36.0, 38.0, 42.0, 34.0, 40.0, 39.0, 34.0, 37.0, 32.0, 36.0, 27.0, 25.0, 28.0, 14.0, 22.0, 14.0, 17.0, 11.0, 7.0, 12.0, 4.0, 11.0, 9.0, 7.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.3984375, -12.9482421875, -12.498046875, -12.0478515625, -11.59765625, -11.1474609375, -10.697265625, -10.2470703125, -9.796875, -9.3466796875, -8.896484375, -8.4462890625, -7.99609375, -7.5458984375, -7.095703125, -6.6455078125, -6.1953125, -5.7451171875, -5.294921875, -4.8447265625, -4.39453125, -3.9443359375, -3.494140625, -3.0439453125, -2.59375, -2.1435546875, -1.693359375, -1.2431640625, -0.79296875, -0.3427734375, 0.107421875, 0.5576171875, 1.0078125, 1.4580078125, 1.908203125, 2.3583984375, 2.80859375, 3.2587890625, 3.708984375, 4.1591796875, 4.609375, 5.0595703125, 5.509765625, 5.9599609375, 6.41015625, 6.8603515625, 7.310546875, 7.7607421875, 8.2109375, 8.6611328125, 9.111328125, 9.5615234375, 10.01171875, 10.4619140625, 10.912109375, 11.3623046875, 11.8125, 12.2626953125, 12.712890625, 13.1630859375, 13.61328125, 14.0634765625, 14.513671875, 14.9638671875, 15.4140625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 5.0, 11.0, 13.0, 24.0, 35.0, 76.0, 99.0, 183.0, 300.0, 529.0, 857.0, 1425.0, 2461.0, 4268.0, 7505.0, 13564.0, 24043.0, 43067.0, 74973.0, 128164.0, 207203.0, 315396.0, 438688.0, 541242.0, 580281.0, 541707.0, 438082.0, 317704.0, 208394.0, 128679.0, 75904.0, 43234.0, 24364.0, 13497.0, 7618.0, 4479.0, 2587.0, 1453.0, 872.0, 494.0, 315.0, 177.0, 111.0, 75.0, 45.0, 29.0, 21.0, 14.0, 5.0, 7.0, 2.0, 5.0, 1.0], "bins": [-19.421875, -18.8748779296875, -18.327880859375, -17.7808837890625, -17.23388671875, -16.6868896484375, -16.139892578125, -15.5928955078125, -15.0458984375, -14.4989013671875, -13.951904296875, -13.4049072265625, -12.85791015625, -12.3109130859375, -11.763916015625, -11.2169189453125, -10.669921875, -10.1229248046875, -9.575927734375, -9.0289306640625, -8.48193359375, -7.9349365234375, -7.387939453125, -6.8409423828125, -6.2939453125, -5.7469482421875, -5.199951171875, -4.6529541015625, -4.10595703125, -3.5589599609375, -3.011962890625, -2.4649658203125, -1.91796875, -1.3709716796875, -0.823974609375, -0.2769775390625, 0.27001953125, 0.8170166015625, 1.364013671875, 1.9110107421875, 2.4580078125, 3.0050048828125, 3.552001953125, 4.0989990234375, 4.64599609375, 5.1929931640625, 5.739990234375, 6.2869873046875, 6.833984375, 7.3809814453125, 7.927978515625, 8.4749755859375, 9.02197265625, 9.5689697265625, 10.115966796875, 10.6629638671875, 11.2099609375, 11.7569580078125, 12.303955078125, 12.8509521484375, 13.39794921875, 13.9449462890625, 14.491943359375, 15.0389404296875, 15.5859375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 16.0, 12.0, 11.0, 18.0, 21.0, 24.0, 48.0, 33.0, 50.0, 65.0, 95.0, 109.0, 105.0, 107.0, 131.0, 162.0, 148.0, 174.0, 187.0, 190.0, 200.0, 178.0, 196.0, 188.0, 179.0, 199.0, 197.0, 147.0, 120.0, 130.0, 106.0, 81.0, 75.0, 81.0, 54.0, 45.0, 47.0, 37.0, 26.0, 22.0, 19.0, 8.0, 11.0, 5.0, 2.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.546875, -6.33489990234375, -6.1229248046875, -5.91094970703125, -5.698974609375, -5.48699951171875, -5.2750244140625, -5.06304931640625, -4.85107421875, -4.63909912109375, -4.4271240234375, -4.21514892578125, -4.003173828125, -3.79119873046875, -3.5792236328125, -3.36724853515625, -3.1552734375, -2.94329833984375, -2.7313232421875, -2.51934814453125, -2.307373046875, -2.09539794921875, -1.8834228515625, -1.67144775390625, -1.45947265625, -1.24749755859375, -1.0355224609375, -0.82354736328125, -0.611572265625, -0.39959716796875, -0.1876220703125, 0.02435302734375, 0.236328125, 0.44830322265625, 0.6602783203125, 0.87225341796875, 1.084228515625, 1.29620361328125, 1.5081787109375, 1.72015380859375, 1.93212890625, 2.14410400390625, 2.3560791015625, 2.56805419921875, 2.780029296875, 2.99200439453125, 3.2039794921875, 3.41595458984375, 3.6279296875, 3.83990478515625, 4.0518798828125, 4.26385498046875, 4.475830078125, 4.68780517578125, 4.8997802734375, 5.11175537109375, 5.32373046875, 5.53570556640625, 5.7476806640625, 5.95965576171875, 6.171630859375, 6.38360595703125, 6.5955810546875, 6.80755615234375, 7.01953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 7.0, 6.0, 3.0, 16.0, 12.0, 20.0, 26.0, 21.0, 24.0, 37.0, 49.0, 54.0, 53.0, 57.0, 49.0, 44.0, 50.0, 75.0, 49.0, 56.0, 51.0, 40.0, 31.0, 42.0, 28.0, 22.0, 18.0, 10.0, 11.0, 17.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.895763397216797, -16.224443435668945, -15.553123474121094, -14.881803512573242, -14.21048355102539, -13.539163589477539, -12.867844581604004, -12.196524620056152, -11.5252046585083, -10.85388469696045, -10.182564735412598, -9.511245727539062, -8.839925765991211, -8.16860580444336, -7.497285842895508, -6.825965881347656, -6.154645919799805, -5.483325958251953, -4.812005996704102, -4.140686511993408, -3.4693665504455566, -2.798046588897705, -2.1267271041870117, -1.4554071426391602, -0.7840871810913086, -0.11276733875274658, 0.5585525035858154, 1.229872226715088, 1.9011921882629395, 2.572512149810791, 3.2438316345214844, 3.915151596069336, 4.5864715576171875, 5.257791519165039, 5.929111480712891, 6.600430965423584, 7.2717509269714355, 7.943070888519287, 8.61439037322998, 9.285710334777832, 9.957030296325684, 10.628350257873535, 11.299670219421387, 11.970989227294922, 12.642309188842773, 13.313629150390625, 13.984949111938477, 14.656269073486328, 15.32758903503418, 15.998908996582031, 16.670228958129883, 17.341548919677734, 18.012868881225586, 18.684188842773438, 19.355506896972656, 20.02682876586914, 20.69814682006836, 21.36946678161621, 22.040786743164062, 22.712106704711914, 23.383426666259766, 24.054746627807617, 24.72606658935547, 25.397384643554688, 26.068706512451172]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 8.0, 11.0, 17.0, 9.0, 15.0, 25.0, 22.0, 33.0, 39.0, 38.0, 37.0, 50.0, 38.0, 33.0, 40.0, 43.0, 35.0, 42.0, 59.0, 50.0, 41.0, 37.0, 38.0, 36.0, 20.0, 23.0, 22.0, 18.0, 21.0, 18.0, 13.0, 15.0, 14.0, 9.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.033568382263184, -14.452958106994629, -13.872347831726074, -13.291738510131836, -12.711128234863281, -12.130517959594727, -11.549907684326172, -10.969297409057617, -10.388687133789062, -9.808076858520508, -9.227466583251953, -8.646856307983398, -8.06624698638916, -7.4856367111206055, -6.905026435852051, -6.324416637420654, -5.743806838989258, -5.163196563720703, -4.582586765289307, -4.001976490020752, -3.4213664531707764, -2.840756416320801, -2.260146141052246, -1.6795363426208496, -1.098926067352295, -0.5183159708976746, 0.0622941255569458, 0.6429042816162109, 1.2235143184661865, 1.804124355316162, 2.384734630584717, 2.9653444290161133, 3.5459537506103516, 4.126564025878906, 4.707173824310303, 5.287784099578857, 5.868393898010254, 6.449004173278809, 7.029614448547363, 7.61022424697876, 8.190834045410156, 8.771444320678711, 9.352054595947266, 9.93266487121582, 10.513274192810059, 11.093884468078613, 11.674494743347168, 12.255104064941406, 12.835715293884277, 13.416325569152832, 13.996935844421387, 14.577545166015625, 15.15815544128418, 15.738765716552734, 16.31937599182129, 16.899986267089844, 17.4805965423584, 18.061206817626953, 18.641817092895508, 19.222427368164062, 19.803037643432617, 20.383647918701172, 20.964256286621094, 21.54486656188965, 22.125476837158203]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 10.0, 11.0, 20.0, 47.0, 48.0, 62.0, 137.0, 232.0, 316.0, 513.0, 787.0, 1369.0, 2304.0, 4004.0, 6777.0, 11559.0, 19740.0, 33553.0, 55081.0, 85302.0, 121708.0, 152080.0, 157531.0, 133937.0, 97781.0, 64672.0, 39952.0, 24246.0, 14262.0, 8323.0, 4891.0, 2949.0, 1691.0, 1051.0, 600.0, 374.0, 233.0, 147.0, 94.0, 73.0, 36.0, 21.0, 10.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.46484375, -3.357177734375, -3.24951171875, -3.141845703125, -3.0341796875, -2.926513671875, -2.81884765625, -2.711181640625, -2.603515625, -2.495849609375, -2.38818359375, -2.280517578125, -2.1728515625, -2.065185546875, -1.95751953125, -1.849853515625, -1.7421875, -1.634521484375, -1.52685546875, -1.419189453125, -1.3115234375, -1.203857421875, -1.09619140625, -0.988525390625, -0.880859375, -0.773193359375, -0.66552734375, -0.557861328125, -0.4501953125, -0.342529296875, -0.23486328125, -0.127197265625, -0.01953125, 0.088134765625, 0.19580078125, 0.303466796875, 0.4111328125, 0.518798828125, 0.62646484375, 0.734130859375, 0.841796875, 0.949462890625, 1.05712890625, 1.164794921875, 1.2724609375, 1.380126953125, 1.48779296875, 1.595458984375, 1.703125, 1.810791015625, 1.91845703125, 2.026123046875, 2.1337890625, 2.241455078125, 2.34912109375, 2.456787109375, 2.564453125, 2.672119140625, 2.77978515625, 2.887451171875, 2.9951171875, 3.102783203125, 3.21044921875, 3.318115234375, 3.42578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 11.0, 16.0, 10.0, 14.0, 26.0, 21.0, 32.0, 40.0, 38.0, 36.0, 53.0, 38.0, 30.0, 38.0, 43.0, 37.0, 44.0, 63.0, 46.0, 42.0, 36.0, 41.0, 33.0, 20.0, 22.0, 23.0, 17.0, 20.0, 20.0, 13.0, 14.0, 15.0, 8.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.4422607421875, -13.861083984375, -13.2799072265625, -12.69873046875, -12.1175537109375, -11.536376953125, -10.9552001953125, -10.3740234375, -9.7928466796875, -9.211669921875, -8.6304931640625, -8.04931640625, -7.4681396484375, -6.886962890625, -6.3057861328125, -5.724609375, -5.1434326171875, -4.562255859375, -3.9810791015625, -3.39990234375, -2.8187255859375, -2.237548828125, -1.6563720703125, -1.0751953125, -0.4940185546875, 0.087158203125, 0.6683349609375, 1.24951171875, 1.8306884765625, 2.411865234375, 2.9930419921875, 3.57421875, 4.1553955078125, 4.736572265625, 5.3177490234375, 5.89892578125, 6.4801025390625, 7.061279296875, 7.6424560546875, 8.2236328125, 8.8048095703125, 9.385986328125, 9.9671630859375, 10.54833984375, 11.1295166015625, 11.710693359375, 12.2918701171875, 12.873046875, 13.4542236328125, 14.035400390625, 14.6165771484375, 15.19775390625, 15.7789306640625, 16.360107421875, 16.9412841796875, 17.5224609375, 18.1036376953125, 18.684814453125, 19.2659912109375, 19.84716796875, 20.4283447265625, 21.009521484375, 21.5906982421875, 22.171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 11.0, 6.0, 13.0, 12.0, 19.0, 17.0, 30.0, 33.0, 56.0, 91.0, 114.0, 181.0, 285.0, 371.0, 583.0, 814.0, 1270.0, 1901.0, 2906.0, 4546.0, 7116.0, 11355.0, 19305.0, 38713.0, 626233.0, 257485.0, 30311.0, 16578.0, 10005.0, 6463.0, 3972.0, 2572.0, 1690.0, 1151.0, 737.0, 525.0, 357.0, 207.0, 141.0, 122.0, 79.0, 53.0, 36.0, 27.0, 18.0, 13.0, 11.0, 9.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.015625, -5.814208984375, -5.61279296875, -5.411376953125, -5.2099609375, -5.008544921875, -4.80712890625, -4.605712890625, -4.404296875, -4.202880859375, -4.00146484375, -3.800048828125, -3.5986328125, -3.397216796875, -3.19580078125, -2.994384765625, -2.79296875, -2.591552734375, -2.39013671875, -2.188720703125, -1.9873046875, -1.785888671875, -1.58447265625, -1.383056640625, -1.181640625, -0.980224609375, -0.77880859375, -0.577392578125, -0.3759765625, -0.174560546875, 0.02685546875, 0.228271484375, 0.4296875, 0.631103515625, 0.83251953125, 1.033935546875, 1.2353515625, 1.436767578125, 1.63818359375, 1.839599609375, 2.041015625, 2.242431640625, 2.44384765625, 2.645263671875, 2.8466796875, 3.048095703125, 3.24951171875, 3.450927734375, 3.65234375, 3.853759765625, 4.05517578125, 4.256591796875, 4.4580078125, 4.659423828125, 4.86083984375, 5.062255859375, 5.263671875, 5.465087890625, 5.66650390625, 5.867919921875, 6.0693359375, 6.270751953125, 6.47216796875, 6.673583984375, 6.875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 3.0, 6.0, 6.0, 8.0, 9.0, 15.0, 13.0, 29.0, 21.0, 19.0, 25.0, 23.0, 33.0, 38.0, 40.0, 42.0, 41.0, 36.0, 44.0, 24.0, 39.0, 47.0, 44.0, 36.0, 35.0, 28.0, 29.0, 32.0, 20.0, 27.0, 21.0, 26.0, 24.0, 14.0, 17.0, 14.0, 12.0, 8.0, 12.0, 10.0, 9.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.96875, -10.63720703125, -10.3056640625, -9.97412109375, -9.642578125, -9.31103515625, -8.9794921875, -8.64794921875, -8.31640625, -7.98486328125, -7.6533203125, -7.32177734375, -6.990234375, -6.65869140625, -6.3271484375, -5.99560546875, -5.6640625, -5.33251953125, -5.0009765625, -4.66943359375, -4.337890625, -4.00634765625, -3.6748046875, -3.34326171875, -3.01171875, -2.68017578125, -2.3486328125, -2.01708984375, -1.685546875, -1.35400390625, -1.0224609375, -0.69091796875, -0.359375, -0.02783203125, 0.3037109375, 0.63525390625, 0.966796875, 1.29833984375, 1.6298828125, 1.96142578125, 2.29296875, 2.62451171875, 2.9560546875, 3.28759765625, 3.619140625, 3.95068359375, 4.2822265625, 4.61376953125, 4.9453125, 5.27685546875, 5.6083984375, 5.93994140625, 6.271484375, 6.60302734375, 6.9345703125, 7.26611328125, 7.59765625, 7.92919921875, 8.2607421875, 8.59228515625, 8.923828125, 9.25537109375, 9.5869140625, 9.91845703125, 10.25]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 15.0, 25.0, 24.0, 38.0, 62.0, 102.0, 155.0, 224.0, 482.0, 848.0, 1722.0, 3599.0, 8129.0, 18435.0, 47163.0, 882783.0, 49859.0, 19010.0, 8256.0, 3789.0, 1765.0, 900.0, 471.0, 290.0, 127.0, 90.0, 51.0, 38.0, 21.0, 16.0, 14.0, 8.0, 10.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98828125, -0.954803466796875, -0.92132568359375, -0.887847900390625, -0.8543701171875, -0.820892333984375, -0.78741455078125, -0.753936767578125, -0.720458984375, -0.686981201171875, -0.65350341796875, -0.620025634765625, -0.5865478515625, -0.553070068359375, -0.51959228515625, -0.486114501953125, -0.45263671875, -0.419158935546875, -0.38568115234375, -0.352203369140625, -0.3187255859375, -0.285247802734375, -0.25177001953125, -0.218292236328125, -0.184814453125, -0.151336669921875, -0.11785888671875, -0.084381103515625, -0.0509033203125, -0.017425537109375, 0.01605224609375, 0.049530029296875, 0.0830078125, 0.116485595703125, 0.14996337890625, 0.183441162109375, 0.2169189453125, 0.250396728515625, 0.28387451171875, 0.317352294921875, 0.350830078125, 0.384307861328125, 0.41778564453125, 0.451263427734375, 0.4847412109375, 0.518218994140625, 0.55169677734375, 0.585174560546875, 0.61865234375, 0.652130126953125, 0.68560791015625, 0.719085693359375, 0.7525634765625, 0.786041259765625, 0.81951904296875, 0.852996826171875, 0.886474609375, 0.919952392578125, 0.95343017578125, 0.986907958984375, 1.0203857421875, 1.053863525390625, 1.08734130859375, 1.120819091796875, 1.154296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 7.0, 13.0, 13.0, 21.0, 12.0, 27.0, 31.0, 24.0, 33.0, 52.0, 45.0, 55.0, 55.0, 62.0, 52.0, 61.0, 72.0, 67.0, 39.0, 36.0, 56.0, 43.0, 24.0, 18.0, 16.0, 18.0, 10.0, 18.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.759695053100586e-05, -2.6722438633441925e-05, -2.584792673587799e-05, -2.4973414838314056e-05, -2.4098902940750122e-05, -2.3224391043186188e-05, -2.2349879145622253e-05, -2.147536724805832e-05, -2.0600855350494385e-05, -1.972634345293045e-05, -1.8851831555366516e-05, -1.7977319657802582e-05, -1.7102807760238647e-05, -1.6228295862674713e-05, -1.535378396511078e-05, -1.4479272067546844e-05, -1.360476016998291e-05, -1.2730248272418976e-05, -1.1855736374855042e-05, -1.0981224477291107e-05, -1.0106712579727173e-05, -9.232200682163239e-06, -8.357688784599304e-06, -7.48317688703537e-06, -6.6086649894714355e-06, -5.734153091907501e-06, -4.859641194343567e-06, -3.9851292967796326e-06, -3.1106173992156982e-06, -2.236105501651764e-06, -1.3615936040878296e-06, -4.870817065238953e-07, 3.8743019104003906e-07, 1.2619420886039734e-06, 2.1364539861679077e-06, 3.010965883731842e-06, 3.885477781295776e-06, 4.759989678859711e-06, 5.634501576423645e-06, 6.509013473987579e-06, 7.383525371551514e-06, 8.258037269115448e-06, 9.132549166679382e-06, 1.0007061064243317e-05, 1.0881572961807251e-05, 1.1756084859371185e-05, 1.263059675693512e-05, 1.3505108654499054e-05, 1.4379620552062988e-05, 1.5254132449626923e-05, 1.6128644347190857e-05, 1.700315624475479e-05, 1.7877668142318726e-05, 1.875218003988266e-05, 1.9626691937446594e-05, 2.050120383501053e-05, 2.1375715732574463e-05, 2.2250227630138397e-05, 2.312473952770233e-05, 2.3999251425266266e-05, 2.48737633228302e-05, 2.5748275220394135e-05, 2.662278711795807e-05, 2.7497299015522003e-05, 2.8371810913085938e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 4.0, 7.0, 13.0, 18.0, 21.0, 30.0, 41.0, 83.0, 96.0, 151.0, 216.0, 342.0, 487.0, 664.0, 986.0, 1411.0, 2041.0, 3015.0, 4224.0, 6214.0, 8953.0, 13219.0, 19179.0, 27422.0, 39191.0, 54609.0, 75522.0, 99585.0, 123500.0, 130278.0, 115364.0, 91388.0, 68003.0, 48839.0, 35088.0, 24335.0, 16794.0, 11513.0, 7961.0, 5476.0, 3835.0, 2599.0, 1802.0, 1260.0, 911.0, 558.0, 441.0, 268.0, 202.0, 123.0, 102.0, 63.0, 29.0, 34.0, 16.0, 18.0, 8.0, 9.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.54833984375, -0.5308380126953125, -0.513336181640625, -0.4958343505859375, -0.47833251953125, -0.4608306884765625, -0.443328857421875, -0.4258270263671875, -0.4083251953125, -0.3908233642578125, -0.373321533203125, -0.3558197021484375, -0.33831787109375, -0.3208160400390625, -0.303314208984375, -0.2858123779296875, -0.268310546875, -0.2508087158203125, -0.233306884765625, -0.2158050537109375, -0.19830322265625, -0.1808013916015625, -0.163299560546875, -0.1457977294921875, -0.1282958984375, -0.1107940673828125, -0.093292236328125, -0.0757904052734375, -0.05828857421875, -0.0407867431640625, -0.023284912109375, -0.0057830810546875, 0.01171875, 0.0292205810546875, 0.046722412109375, 0.0642242431640625, 0.08172607421875, 0.0992279052734375, 0.116729736328125, 0.1342315673828125, 0.1517333984375, 0.1692352294921875, 0.186737060546875, 0.2042388916015625, 0.22174072265625, 0.2392425537109375, 0.256744384765625, 0.2742462158203125, 0.291748046875, 0.3092498779296875, 0.326751708984375, 0.3442535400390625, 0.36175537109375, 0.3792572021484375, 0.396759033203125, 0.4142608642578125, 0.4317626953125, 0.4492645263671875, 0.466766357421875, 0.4842681884765625, 0.50177001953125, 0.5192718505859375, 0.536773681640625, 0.5542755126953125, 0.57177734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 7.0, 16.0, 19.0, 16.0, 36.0, 39.0, 52.0, 56.0, 88.0, 105.0, 80.0, 87.0, 81.0, 56.0, 51.0, 28.0, 35.0, 34.0, 21.0, 22.0, 10.0, 10.0, 8.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3486328125, -0.3353767395019531, -0.32212066650390625, -0.3088645935058594, -0.2956085205078125, -0.2823524475097656, -0.26909637451171875, -0.2558403015136719, -0.242584228515625, -0.22932815551757812, -0.21607208251953125, -0.20281600952148438, -0.1895599365234375, -0.17630386352539062, -0.16304779052734375, -0.14979171752929688, -0.13653564453125, -0.12327957153320312, -0.11002349853515625, -0.09676742553710938, -0.0835113525390625, -0.07025527954101562, -0.05699920654296875, -0.043743133544921875, -0.030487060546875, -0.017230987548828125, -0.00397491455078125, 0.009281158447265625, 0.0225372314453125, 0.035793304443359375, 0.04904937744140625, 0.062305450439453125, 0.0755615234375, 0.08881759643554688, 0.10207366943359375, 0.11532974243164062, 0.1285858154296875, 0.14184188842773438, 0.15509796142578125, 0.16835403442382812, 0.181610107421875, 0.19486618041992188, 0.20812225341796875, 0.22137832641601562, 0.2346343994140625, 0.24789047241210938, 0.26114654541015625, 0.2744026184082031, 0.28765869140625, 0.3009147644042969, 0.31417083740234375, 0.3274269104003906, 0.3406829833984375, 0.3539390563964844, 0.36719512939453125, 0.3804512023925781, 0.393707275390625, 0.4069633483886719, 0.42021942138671875, 0.4334754943847656, 0.4467315673828125, 0.4599876403808594, 0.47324371337890625, 0.4864997863769531, 0.499755859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 6.0, 12.0, 12.0, 16.0, 24.0, 29.0, 23.0, 37.0, 48.0, 49.0, 63.0, 51.0, 47.0, 47.0, 56.0, 73.0, 53.0, 57.0, 53.0, 30.0, 43.0, 37.0, 25.0, 24.0, 18.0, 14.0, 15.0, 9.0, 6.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.340423583984375, -16.648508071899414, -15.95659065246582, -15.264674186706543, -14.572757720947266, -13.880841255187988, -13.188924789428711, -12.49700927734375, -11.805091857910156, -11.113175392150879, -10.421258926391602, -9.729342460632324, -9.037425994873047, -8.34550952911377, -7.65359354019165, -6.961677074432373, -6.269761085510254, -5.577844619750977, -4.885928153991699, -4.194011688232422, -3.5020954608917236, -2.8101789951324463, -2.118262767791748, -1.4263463020324707, -0.7344298362731934, -0.04251343011856079, 0.6494029760360718, 1.3413193225860596, 2.033235788345337, 2.7251522541046143, 3.4170684814453125, 4.10898494720459, 4.800901412963867, 5.4928178787231445, 6.184734344482422, 6.876650810241699, 7.568567276000977, 8.260483741760254, 8.952400207519531, 9.644315719604492, 10.336233139038086, 11.028149604797363, 11.72006607055664, 12.411982536315918, 13.103899002075195, 13.795815467834473, 14.48773193359375, 15.179647445678711, 15.871563911437988, 16.563480377197266, 17.255395889282227, 17.94731330871582, 18.63922882080078, 19.331146240234375, 20.023061752319336, 20.71497917175293, 21.40689468383789, 22.09881019592285, 22.790727615356445, 23.482643127441406, 24.174560546875, 24.86647605895996, 25.558393478393555, 26.250308990478516, 26.94222640991211]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 9.0, 11.0, 18.0, 8.0, 15.0, 25.0, 24.0, 31.0, 37.0, 40.0, 38.0, 52.0, 37.0, 30.0, 45.0, 40.0, 34.0, 46.0, 58.0, 50.0, 39.0, 37.0, 38.0, 36.0, 18.0, 25.0, 21.0, 20.0, 21.0, 20.0, 12.0, 10.0, 16.0, 9.0, 4.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.009733200073242, -14.427873611450195, -13.846014022827148, -13.264155387878418, -12.682295799255371, -12.100436210632324, -11.518577575683594, -10.936717987060547, -10.3548583984375, -9.772998809814453, -9.191139221191406, -8.609280586242676, -8.027420997619629, -7.445561408996582, -6.863702297210693, -6.281843185424805, -5.699983596801758, -5.118124008178711, -4.536264896392822, -3.9544055461883545, -3.3725461959838867, -2.790686845779419, -2.208827495574951, -1.6269683837890625, -1.0451087951660156, -0.46324944496154785, 0.11860990524291992, 0.7004692554473877, 1.2823286056518555, 1.8641879558563232, 2.446047306060791, 3.0279064178466797, 3.6097679138183594, 4.191627502441406, 4.773486614227295, 5.355345726013184, 5.9372053146362305, 6.519064903259277, 7.100924015045166, 7.682783126831055, 8.264642715454102, 8.846502304077148, 9.428361892700195, 10.010220527648926, 10.592080116271973, 11.17393970489502, 11.75579833984375, 12.337657928466797, 12.919517517089844, 13.50137710571289, 14.083236694335938, 14.665095329284668, 15.246954917907715, 15.828814506530762, 16.410673141479492, 16.99253273010254, 17.574392318725586, 18.156251907348633, 18.73811149597168, 19.319971084594727, 19.90182876586914, 20.483688354492188, 21.065547943115234, 21.64740753173828, 22.229267120361328]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 8.0, 12.0, 26.0, 40.0, 69.0, 112.0, 184.0, 290.0, 454.0, 741.0, 1201.0, 1894.0, 2783.0, 4592.0, 7008.0, 10834.0, 16136.0, 23913.0, 33868.0, 45959.0, 60985.0, 75862.0, 89043.0, 99212.0, 102521.0, 99030.0, 88828.0, 75111.0, 59846.0, 45685.0, 33332.0, 23365.0, 15791.0, 10574.0, 6968.0, 4585.0, 2806.0, 1865.0, 1186.0, 693.0, 450.0, 265.0, 170.0, 100.0, 61.0, 40.0, 25.0, 11.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.21875, -11.83056640625, -11.4423828125, -11.05419921875, -10.666015625, -10.27783203125, -9.8896484375, -9.50146484375, -9.11328125, -8.72509765625, -8.3369140625, -7.94873046875, -7.560546875, -7.17236328125, -6.7841796875, -6.39599609375, -6.0078125, -5.61962890625, -5.2314453125, -4.84326171875, -4.455078125, -4.06689453125, -3.6787109375, -3.29052734375, -2.90234375, -2.51416015625, -2.1259765625, -1.73779296875, -1.349609375, -0.96142578125, -0.5732421875, -0.18505859375, 0.203125, 0.59130859375, 0.9794921875, 1.36767578125, 1.755859375, 2.14404296875, 2.5322265625, 2.92041015625, 3.30859375, 3.69677734375, 4.0849609375, 4.47314453125, 4.861328125, 5.24951171875, 5.6376953125, 6.02587890625, 6.4140625, 6.80224609375, 7.1904296875, 7.57861328125, 7.966796875, 8.35498046875, 8.7431640625, 9.13134765625, 9.51953125, 9.90771484375, 10.2958984375, 10.68408203125, 11.072265625, 11.46044921875, 11.8486328125, 12.23681640625, 12.625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 9.0, 13.0, 15.0, 12.0, 14.0, 26.0, 25.0, 31.0, 41.0, 39.0, 36.0, 54.0, 36.0, 31.0, 40.0, 44.0, 36.0, 48.0, 55.0, 46.0, 41.0, 44.0, 39.0, 27.0, 19.0, 28.0, 18.0, 22.0, 20.0, 17.0, 12.0, 10.0, 15.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -13.949462890625, -13.38330078125, -12.817138671875, -12.2509765625, -11.684814453125, -11.11865234375, -10.552490234375, -9.986328125, -9.420166015625, -8.85400390625, -8.287841796875, -7.7216796875, -7.155517578125, -6.58935546875, -6.023193359375, -5.45703125, -4.890869140625, -4.32470703125, -3.758544921875, -3.1923828125, -2.626220703125, -2.06005859375, -1.493896484375, -0.927734375, -0.361572265625, 0.20458984375, 0.770751953125, 1.3369140625, 1.903076171875, 2.46923828125, 3.035400390625, 3.6015625, 4.167724609375, 4.73388671875, 5.300048828125, 5.8662109375, 6.432373046875, 6.99853515625, 7.564697265625, 8.130859375, 8.697021484375, 9.26318359375, 9.829345703125, 10.3955078125, 10.961669921875, 11.52783203125, 12.093994140625, 12.66015625, 13.226318359375, 13.79248046875, 14.358642578125, 14.9248046875, 15.490966796875, 16.05712890625, 16.623291015625, 17.189453125, 17.755615234375, 18.32177734375, 18.887939453125, 19.4541015625, 20.020263671875, 20.58642578125, 21.152587890625, 21.71875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 18.0, 19.0, 41.0, 82.0, 113.0, 169.0, 311.0, 475.0, 736.0, 1169.0, 1885.0, 2834.0, 4386.0, 6632.0, 9853.0, 14481.0, 20949.0, 29346.0, 39861.0, 52376.0, 66198.0, 79680.0, 90352.0, 96493.0, 96657.0, 91579.0, 80764.0, 67831.0, 53932.0, 41518.0, 30446.0, 22122.0, 15147.0, 10300.0, 6947.0, 4567.0, 3025.0, 1917.0, 1204.0, 817.0, 488.0, 336.0, 179.0, 135.0, 61.0, 32.0, 35.0, 22.0, 11.0, 7.0, 9.0, 3.0, 0.0, 0.0, 1.0], "bins": [-11.453125, -11.106689453125, -10.76025390625, -10.413818359375, -10.0673828125, -9.720947265625, -9.37451171875, -9.028076171875, -8.681640625, -8.335205078125, -7.98876953125, -7.642333984375, -7.2958984375, -6.949462890625, -6.60302734375, -6.256591796875, -5.91015625, -5.563720703125, -5.21728515625, -4.870849609375, -4.5244140625, -4.177978515625, -3.83154296875, -3.485107421875, -3.138671875, -2.792236328125, -2.44580078125, -2.099365234375, -1.7529296875, -1.406494140625, -1.06005859375, -0.713623046875, -0.3671875, -0.020751953125, 0.32568359375, 0.672119140625, 1.0185546875, 1.364990234375, 1.71142578125, 2.057861328125, 2.404296875, 2.750732421875, 3.09716796875, 3.443603515625, 3.7900390625, 4.136474609375, 4.48291015625, 4.829345703125, 5.17578125, 5.522216796875, 5.86865234375, 6.215087890625, 6.5615234375, 6.907958984375, 7.25439453125, 7.600830078125, 7.947265625, 8.293701171875, 8.64013671875, 8.986572265625, 9.3330078125, 9.679443359375, 10.02587890625, 10.372314453125, 10.71875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 3.0, 5.0, 5.0, 5.0, 16.0, 5.0, 24.0, 13.0, 25.0, 26.0, 29.0, 35.0, 27.0, 48.0, 32.0, 45.0, 37.0, 41.0, 44.0, 46.0, 44.0, 42.0, 34.0, 38.0, 42.0, 30.0, 30.0, 37.0, 17.0, 19.0, 20.0, 20.0, 18.0, 10.0, 15.0, 13.0, 11.0, 6.0, 6.0, 3.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.5546875, -11.2178955078125, -10.881103515625, -10.5443115234375, -10.20751953125, -9.8707275390625, -9.533935546875, -9.1971435546875, -8.8603515625, -8.5235595703125, -8.186767578125, -7.8499755859375, -7.51318359375, -7.1763916015625, -6.839599609375, -6.5028076171875, -6.166015625, -5.8292236328125, -5.492431640625, -5.1556396484375, -4.81884765625, -4.4820556640625, -4.145263671875, -3.8084716796875, -3.4716796875, -3.1348876953125, -2.798095703125, -2.4613037109375, -2.12451171875, -1.7877197265625, -1.450927734375, -1.1141357421875, -0.77734375, -0.4405517578125, -0.103759765625, 0.2330322265625, 0.56982421875, 0.9066162109375, 1.243408203125, 1.5802001953125, 1.9169921875, 2.2537841796875, 2.590576171875, 2.9273681640625, 3.26416015625, 3.6009521484375, 3.937744140625, 4.2745361328125, 4.611328125, 4.9481201171875, 5.284912109375, 5.6217041015625, 5.95849609375, 6.2952880859375, 6.632080078125, 6.9688720703125, 7.3056640625, 7.6424560546875, 7.979248046875, 8.3160400390625, 8.65283203125, 8.9896240234375, 9.326416015625, 9.6632080078125, 10.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 10.0, 10.0, 12.0, 23.0, 47.0, 71.0, 115.0, 177.0, 291.0, 407.0, 625.0, 1058.0, 1567.0, 2423.0, 3947.0, 5840.0, 9150.0, 13865.0, 20635.0, 29646.0, 41977.0, 56464.0, 72966.0, 88529.0, 100656.0, 105931.0, 103531.0, 93934.0, 79638.0, 62931.0, 47506.0, 34279.0, 23918.0, 15907.0, 10612.0, 7045.0, 4505.0, 2976.0, 1854.0, 1247.0, 774.0, 489.0, 338.0, 230.0, 143.0, 89.0, 54.0, 41.0, 23.0, 18.0, 15.0, 8.0, 14.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5078125, -4.35601806640625, -4.2042236328125, -4.05242919921875, -3.900634765625, -3.74884033203125, -3.5970458984375, -3.44525146484375, -3.29345703125, -3.14166259765625, -2.9898681640625, -2.83807373046875, -2.686279296875, -2.53448486328125, -2.3826904296875, -2.23089599609375, -2.0791015625, -1.92730712890625, -1.7755126953125, -1.62371826171875, -1.471923828125, -1.32012939453125, -1.1683349609375, -1.01654052734375, -0.86474609375, -0.71295166015625, -0.5611572265625, -0.40936279296875, -0.257568359375, -0.10577392578125, 0.0460205078125, 0.19781494140625, 0.349609375, 0.50140380859375, 0.6531982421875, 0.80499267578125, 0.956787109375, 1.10858154296875, 1.2603759765625, 1.41217041015625, 1.56396484375, 1.71575927734375, 1.8675537109375, 2.01934814453125, 2.171142578125, 2.32293701171875, 2.4747314453125, 2.62652587890625, 2.7783203125, 2.93011474609375, 3.0819091796875, 3.23370361328125, 3.385498046875, 3.53729248046875, 3.6890869140625, 3.84088134765625, 3.99267578125, 4.14447021484375, 4.2962646484375, 4.44805908203125, 4.599853515625, 4.75164794921875, 4.9034423828125, 5.05523681640625, 5.20703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 10.0, 8.0, 7.0, 11.0, 11.0, 18.0, 23.0, 23.0, 16.0, 19.0, 27.0, 30.0, 38.0, 30.0, 38.0, 42.0, 29.0, 41.0, 34.0, 39.0, 31.0, 38.0, 45.0, 44.0, 46.0, 22.0, 26.0, 29.0, 27.0, 29.0, 20.0, 14.0, 17.0, 16.0, 20.0, 13.0, 7.0, 8.0, 7.0, 4.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0005383491516113281, -0.0005207434296607971, -0.0005031377077102661, -0.0004855319857597351, -0.0004679262638092041, -0.0004503205418586731, -0.0004327148199081421, -0.0004151090979576111, -0.0003975033760070801, -0.00037989765405654907, -0.00036229193210601807, -0.00034468621015548706, -0.00032708048820495605, -0.00030947476625442505, -0.00029186904430389404, -0.00027426332235336304, -0.00025665760040283203, -0.00023905187845230103, -0.00022144615650177002, -0.00020384043455123901, -0.000186234712600708, -0.000168628990650177, -0.000151023268699646, -0.000133417546749115, -0.00011581182479858398, -9.820610284805298e-05, -8.060038089752197e-05, -6.299465894699097e-05, -4.538893699645996e-05, -2.7783215045928955e-05, -1.017749309539795e-05, 7.428228855133057e-06, 2.5033950805664062e-05, 4.263967275619507e-05, 6.0245394706726074e-05, 7.785111665725708e-05, 9.545683860778809e-05, 0.00011306256055831909, 0.0001306682825088501, 0.0001482740044593811, 0.0001658797264099121, 0.00018348544836044312, 0.00020109117031097412, 0.00021869689226150513, 0.00023630261421203613, 0.00025390833616256714, 0.00027151405811309814, 0.00028911978006362915, 0.00030672550201416016, 0.00032433122396469116, 0.00034193694591522217, 0.0003595426678657532, 0.0003771483898162842, 0.0003947541117668152, 0.0004123598337173462, 0.0004299655556678772, 0.0004475712776184082, 0.0004651769995689392, 0.0004827827215194702, 0.0005003884434700012, 0.0005179941654205322, 0.0005355998873710632, 0.0005532056093215942, 0.0005708113312721252, 0.0005884170532226562]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 11.0, 11.0, 16.0, 18.0, 39.0, 64.0, 104.0, 176.0, 263.0, 393.0, 610.0, 1051.0, 1671.0, 2603.0, 4353.0, 6943.0, 10758.0, 16799.0, 25626.0, 37872.0, 53746.0, 72404.0, 91015.0, 106797.0, 114447.0, 112520.0, 100705.0, 83670.0, 65008.0, 46966.0, 32239.0, 21582.0, 14179.0, 8942.0, 5600.0, 3524.0, 2241.0, 1329.0, 834.0, 529.0, 317.0, 200.0, 144.0, 86.0, 59.0, 39.0, 20.0, 9.0, 8.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.9609375, -5.7791748046875, -5.597412109375, -5.4156494140625, -5.23388671875, -5.0521240234375, -4.870361328125, -4.6885986328125, -4.5068359375, -4.3250732421875, -4.143310546875, -3.9615478515625, -3.77978515625, -3.5980224609375, -3.416259765625, -3.2344970703125, -3.052734375, -2.8709716796875, -2.689208984375, -2.5074462890625, -2.32568359375, -2.1439208984375, -1.962158203125, -1.7803955078125, -1.5986328125, -1.4168701171875, -1.235107421875, -1.0533447265625, -0.87158203125, -0.6898193359375, -0.508056640625, -0.3262939453125, -0.14453125, 0.0372314453125, 0.218994140625, 0.4007568359375, 0.58251953125, 0.7642822265625, 0.946044921875, 1.1278076171875, 1.3095703125, 1.4913330078125, 1.673095703125, 1.8548583984375, 2.03662109375, 2.2183837890625, 2.400146484375, 2.5819091796875, 2.763671875, 2.9454345703125, 3.127197265625, 3.3089599609375, 3.49072265625, 3.6724853515625, 3.854248046875, 4.0360107421875, 4.2177734375, 4.3995361328125, 4.581298828125, 4.7630615234375, 4.94482421875, 5.1265869140625, 5.308349609375, 5.4901123046875, 5.671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 3.0, 6.0, 8.0, 6.0, 16.0, 13.0, 23.0, 16.0, 18.0, 22.0, 32.0, 38.0, 40.0, 42.0, 36.0, 55.0, 51.0, 53.0, 48.0, 48.0, 43.0, 41.0, 43.0, 41.0, 45.0, 34.0, 21.0, 19.0, 25.0, 22.0, 14.0, 15.0, 18.0, 7.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.443359375, -2.36602783203125, -2.2886962890625, -2.21136474609375, -2.134033203125, -2.05670166015625, -1.9793701171875, -1.90203857421875, -1.82470703125, -1.74737548828125, -1.6700439453125, -1.59271240234375, -1.515380859375, -1.43804931640625, -1.3607177734375, -1.28338623046875, -1.2060546875, -1.12872314453125, -1.0513916015625, -0.97406005859375, -0.896728515625, -0.81939697265625, -0.7420654296875, -0.66473388671875, -0.58740234375, -0.51007080078125, -0.4327392578125, -0.35540771484375, -0.278076171875, -0.20074462890625, -0.1234130859375, -0.04608154296875, 0.03125, 0.10858154296875, 0.1859130859375, 0.26324462890625, 0.340576171875, 0.41790771484375, 0.4952392578125, 0.57257080078125, 0.64990234375, 0.72723388671875, 0.8045654296875, 0.88189697265625, 0.959228515625, 1.03656005859375, 1.1138916015625, 1.19122314453125, 1.2685546875, 1.34588623046875, 1.4232177734375, 1.50054931640625, 1.577880859375, 1.65521240234375, 1.7325439453125, 1.80987548828125, 1.88720703125, 1.96453857421875, 2.0418701171875, 2.11920166015625, 2.196533203125, 2.27386474609375, 2.3511962890625, 2.42852783203125, 2.505859375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 11.0, 10.0, 19.0, 26.0, 28.0, 25.0, 26.0, 36.0, 55.0, 54.0, 53.0, 49.0, 42.0, 47.0, 53.0, 45.0, 56.0, 54.0, 41.0, 36.0, 36.0, 33.0, 30.0, 17.0, 24.0, 17.0, 14.0, 6.0, 11.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.304317474365234, -15.670007705688477, -15.035696983337402, -14.401386260986328, -13.76707649230957, -13.132766723632812, -12.498456001281738, -11.864145278930664, -11.229835510253906, -10.595525741577148, -9.961215019226074, -9.326904296875, -8.692594528198242, -8.058284759521484, -7.42397403717041, -6.789663791656494, -6.155353546142578, -5.521043300628662, -4.886733055114746, -4.25242280960083, -3.618112564086914, -2.983802318572998, -2.349492073059082, -1.715181827545166, -1.08087158203125, -0.446561336517334, 0.18774890899658203, 0.822059154510498, 1.456369400024414, 2.09067964553833, 2.724989891052246, 3.359300136566162, 3.993612289428711, 4.627922534942627, 5.262232780456543, 5.896543025970459, 6.530853271484375, 7.165163516998291, 7.799473762512207, 8.433784484863281, 9.068094253540039, 9.702404022216797, 10.336714744567871, 10.971025466918945, 11.605335235595703, 12.239645004272461, 12.873955726623535, 13.50826644897461, 14.142576217651367, 14.776885986328125, 15.4111967086792, 16.045507431030273, 16.67981719970703, 17.31412696838379, 17.948436737060547, 18.582748413085938, 19.217058181762695, 19.851367950439453, 20.485679626464844, 21.1199893951416, 21.75429916381836, 22.388608932495117, 23.022918701171875, 23.657230377197266, 24.291540145874023]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 13.0, 6.0, 22.0, 15.0, 17.0, 20.0, 25.0, 28.0, 26.0, 31.0, 32.0, 42.0, 35.0, 41.0, 34.0, 36.0, 33.0, 38.0, 37.0, 49.0, 44.0, 36.0, 36.0, 38.0, 42.0, 33.0, 26.0, 21.0, 27.0, 24.0, 19.0, 13.0, 14.0, 13.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.219585418701172, -16.635934829711914, -16.052282333374023, -15.468631744384766, -14.884980201721191, -14.301328659057617, -13.71767807006836, -13.134026527404785, -12.550374984741211, -11.966723442077637, -11.383071899414062, -10.799421310424805, -10.21576976776123, -9.632118225097656, -9.048467636108398, -8.464816093444824, -7.88116455078125, -7.297513008117676, -6.71386194229126, -6.130210876464844, -5.5465593338012695, -4.962907791137695, -4.379256725311279, -3.7956056594848633, -3.211954116821289, -2.628302812576294, -2.044651508331299, -1.4610002040863037, -0.8773488998413086, -0.2936975955963135, 0.28995370864868164, 0.8736047744750977, 1.4572582244873047, 2.0409095287323, 2.624560832977295, 3.20821213722229, 3.791863441467285, 4.375514984130859, 4.959166049957275, 5.542817115783691, 6.126468658447266, 6.71012020111084, 7.293771266937256, 7.877422332763672, 8.461073875427246, 9.04472541809082, 9.628376007080078, 10.212027549743652, 10.795679092407227, 11.3793306350708, 11.962982177734375, 12.546632766723633, 13.130284309387207, 13.713935852050781, 14.297586441040039, 14.881237983703613, 15.464889526367188, 16.048540115356445, 16.632192611694336, 17.215843200683594, 17.799495697021484, 18.383146286010742, 18.966796875, 19.55044937133789, 20.13409996032715]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 1.0, 6.0, 19.0, 24.0, 40.0, 59.0, 102.0, 161.0, 277.0, 429.0, 741.0, 1310.0, 2063.0, 3609.0, 5925.0, 10114.0, 17438.0, 29410.0, 49737.0, 83278.0, 134706.0, 210674.0, 310590.0, 418122.0, 509877.0, 548627.0, 516619.0, 430949.0, 323118.0, 221672.0, 143593.0, 87966.0, 53442.0, 32036.0, 18925.0, 11245.0, 6857.0, 4052.0, 2503.0, 1494.0, 881.0, 584.0, 378.0, 233.0, 140.0, 99.0, 60.0, 36.0, 25.0, 15.0, 10.0, 6.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.3046875, -13.8209228515625, -13.337158203125, -12.8533935546875, -12.36962890625, -11.8858642578125, -11.402099609375, -10.9183349609375, -10.4345703125, -9.9508056640625, -9.467041015625, -8.9832763671875, -8.49951171875, -8.0157470703125, -7.531982421875, -7.0482177734375, -6.564453125, -6.0806884765625, -5.596923828125, -5.1131591796875, -4.62939453125, -4.1456298828125, -3.661865234375, -3.1781005859375, -2.6943359375, -2.2105712890625, -1.726806640625, -1.2430419921875, -0.75927734375, -0.2755126953125, 0.208251953125, 0.6920166015625, 1.17578125, 1.6595458984375, 2.143310546875, 2.6270751953125, 3.11083984375, 3.5946044921875, 4.078369140625, 4.5621337890625, 5.0458984375, 5.5296630859375, 6.013427734375, 6.4971923828125, 6.98095703125, 7.4647216796875, 7.948486328125, 8.4322509765625, 8.916015625, 9.3997802734375, 9.883544921875, 10.3673095703125, 10.85107421875, 11.3348388671875, 11.818603515625, 12.3023681640625, 12.7861328125, 13.2698974609375, 13.753662109375, 14.2374267578125, 14.72119140625, 15.2049560546875, 15.688720703125, 16.1724853515625, 16.65625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 12.0, 12.0, 16.0, 16.0, 21.0, 28.0, 23.0, 26.0, 25.0, 36.0, 37.0, 34.0, 43.0, 31.0, 36.0, 34.0, 38.0, 40.0, 43.0, 48.0, 41.0, 33.0, 39.0, 36.0, 39.0, 25.0, 33.0, 22.0, 24.0, 21.0, 17.0, 13.0, 14.0, 10.0, 7.0, 4.0, 5.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.59375, -15.0595703125, -14.525390625, -13.9912109375, -13.45703125, -12.9228515625, -12.388671875, -11.8544921875, -11.3203125, -10.7861328125, -10.251953125, -9.7177734375, -9.18359375, -8.6494140625, -8.115234375, -7.5810546875, -7.046875, -6.5126953125, -5.978515625, -5.4443359375, -4.91015625, -4.3759765625, -3.841796875, -3.3076171875, -2.7734375, -2.2392578125, -1.705078125, -1.1708984375, -0.63671875, -0.1025390625, 0.431640625, 0.9658203125, 1.5, 2.0341796875, 2.568359375, 3.1025390625, 3.63671875, 4.1708984375, 4.705078125, 5.2392578125, 5.7734375, 6.3076171875, 6.841796875, 7.3759765625, 7.91015625, 8.4443359375, 8.978515625, 9.5126953125, 10.046875, 10.5810546875, 11.115234375, 11.6494140625, 12.18359375, 12.7177734375, 13.251953125, 13.7861328125, 14.3203125, 14.8544921875, 15.388671875, 15.9228515625, 16.45703125, 16.9912109375, 17.525390625, 18.0595703125, 18.59375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 6.0, 13.0, 18.0, 34.0, 72.0, 93.0, 154.0, 260.0, 462.0, 751.0, 1374.0, 2217.0, 4093.0, 6874.0, 12342.0, 22324.0, 39411.0, 69186.0, 116740.0, 189360.0, 290220.0, 404022.0, 510330.0, 564999.0, 546947.0, 462071.0, 348309.0, 237943.0, 151430.0, 90534.0, 52357.0, 30064.0, 17088.0, 9524.0, 5381.0, 2968.0, 1828.0, 972.0, 589.0, 359.0, 233.0, 119.0, 77.0, 42.0, 48.0, 22.0, 12.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -16.918701171875, -16.36865234375, -15.818603515625, -15.2685546875, -14.718505859375, -14.16845703125, -13.618408203125, -13.068359375, -12.518310546875, -11.96826171875, -11.418212890625, -10.8681640625, -10.318115234375, -9.76806640625, -9.218017578125, -8.66796875, -8.117919921875, -7.56787109375, -7.017822265625, -6.4677734375, -5.917724609375, -5.36767578125, -4.817626953125, -4.267578125, -3.717529296875, -3.16748046875, -2.617431640625, -2.0673828125, -1.517333984375, -0.96728515625, -0.417236328125, 0.1328125, 0.682861328125, 1.23291015625, 1.782958984375, 2.3330078125, 2.883056640625, 3.43310546875, 3.983154296875, 4.533203125, 5.083251953125, 5.63330078125, 6.183349609375, 6.7333984375, 7.283447265625, 7.83349609375, 8.383544921875, 8.93359375, 9.483642578125, 10.03369140625, 10.583740234375, 11.1337890625, 11.683837890625, 12.23388671875, 12.783935546875, 13.333984375, 13.884033203125, 14.43408203125, 14.984130859375, 15.5341796875, 16.084228515625, 16.63427734375, 17.184326171875, 17.734375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 9.0, 13.0, 24.0, 29.0, 26.0, 42.0, 39.0, 58.0, 58.0, 60.0, 73.0, 96.0, 100.0, 111.0, 131.0, 154.0, 145.0, 164.0, 142.0, 181.0, 203.0, 201.0, 195.0, 201.0, 173.0, 165.0, 155.0, 129.0, 143.0, 119.0, 114.0, 111.0, 71.0, 89.0, 69.0, 51.0, 41.0, 37.0, 37.0, 24.0, 23.0, 13.0, 11.0, 10.0, 8.0, 2.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0], "bins": [-7.08203125, -6.87255859375, -6.6630859375, -6.45361328125, -6.244140625, -6.03466796875, -5.8251953125, -5.61572265625, -5.40625, -5.19677734375, -4.9873046875, -4.77783203125, -4.568359375, -4.35888671875, -4.1494140625, -3.93994140625, -3.73046875, -3.52099609375, -3.3115234375, -3.10205078125, -2.892578125, -2.68310546875, -2.4736328125, -2.26416015625, -2.0546875, -1.84521484375, -1.6357421875, -1.42626953125, -1.216796875, -1.00732421875, -0.7978515625, -0.58837890625, -0.37890625, -0.16943359375, 0.0400390625, 0.24951171875, 0.458984375, 0.66845703125, 0.8779296875, 1.08740234375, 1.296875, 1.50634765625, 1.7158203125, 1.92529296875, 2.134765625, 2.34423828125, 2.5537109375, 2.76318359375, 2.97265625, 3.18212890625, 3.3916015625, 3.60107421875, 3.810546875, 4.02001953125, 4.2294921875, 4.43896484375, 4.6484375, 4.85791015625, 5.0673828125, 5.27685546875, 5.486328125, 5.69580078125, 5.9052734375, 6.11474609375, 6.32421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 3.0, 3.0, 9.0, 8.0, 10.0, 12.0, 21.0, 19.0, 30.0, 22.0, 31.0, 34.0, 32.0, 40.0, 47.0, 50.0, 42.0, 32.0, 40.0, 50.0, 41.0, 39.0, 48.0, 34.0, 33.0, 40.0, 20.0, 43.0, 22.0, 26.0, 20.0, 21.0, 17.0, 12.0, 4.0, 10.0, 7.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.365427017211914, -16.807409286499023, -16.249391555786133, -15.691372871398926, -15.133354187011719, -14.575336456298828, -14.017318725585938, -13.459300994873047, -12.90128231048584, -12.34326457977295, -11.785245895385742, -11.227228164672852, -10.669210433959961, -10.111191749572754, -9.553174018859863, -8.995155334472656, -8.437137603759766, -7.879119396209717, -7.321101188659668, -6.763083457946777, -6.2050652503967285, -5.64704704284668, -5.089029312133789, -4.53101110458374, -3.9729928970336914, -3.4149746894836426, -2.856956720352173, -2.298938751220703, -1.7409205436706543, -1.1829023361206055, -0.6248843669891357, -0.06686639785766602, 0.4911518096923828, 1.049169898033142, 1.6071879863739014, 2.165205955505371, 2.72322416305542, 3.2812423706054688, 3.8392603397369385, 4.397278308868408, 4.955296516418457, 5.513314723968506, 6.071332931518555, 6.629350662231445, 7.187368869781494, 7.745387077331543, 8.303404808044434, 8.86142349243164, 9.419441223144531, 9.977458953857422, 10.535477638244629, 11.09349536895752, 11.651514053344727, 12.209531784057617, 12.767549514770508, 13.325567245483398, 13.883585929870605, 14.441603660583496, 14.999622344970703, 15.557640075683594, 16.115657806396484, 16.673675537109375, 17.2316951751709, 17.78971290588379, 18.34773063659668]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 17.0, 19.0, 18.0, 22.0, 36.0, 23.0, 35.0, 39.0, 31.0, 39.0, 35.0, 38.0, 38.0, 47.0, 50.0, 41.0, 45.0, 44.0, 36.0, 33.0, 45.0, 29.0, 35.0, 31.0, 29.0, 24.0, 19.0, 24.0, 15.0, 15.0, 10.0, 5.0, 5.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.64324188232422, -20.98698616027832, -20.330730438232422, -19.674476623535156, -19.018220901489258, -18.36196517944336, -17.70570945739746, -17.049453735351562, -16.393198013305664, -15.736942291259766, -15.080687522888184, -14.424431800842285, -13.768176078796387, -13.111921310424805, -12.455665588378906, -11.799409866333008, -11.143155097961426, -10.486899375915527, -9.830644607543945, -9.174388885498047, -8.518133163452148, -7.861877918243408, -7.205622673034668, -6.5493669509887695, -5.893111705780029, -5.236856460571289, -4.580600738525391, -3.9243454933166504, -3.268090009689331, -2.6118345260620117, -1.9555792808532715, -1.299323558807373, -0.6430683135986328, 0.013187110424041748, 0.6694425344467163, 1.325697898864746, 1.9819533824920654, 2.6382088661193848, 3.294464111328125, 3.9507198333740234, 4.606975078582764, 5.263230323791504, 5.919486045837402, 6.575741291046143, 7.231996536254883, 7.888252258300781, 8.54450798034668, 9.200763702392578, 9.85701847076416, 10.513274192810059, 11.16952896118164, 11.825784683227539, 12.482040405273438, 13.138296127319336, 13.794550895690918, 14.450806617736816, 15.107061386108398, 15.763317108154297, 16.419572830200195, 17.075828552246094, 17.73208236694336, 18.388338088989258, 19.044593811035156, 19.700849533081055, 20.357105255126953]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 11.0, 22.0, 20.0, 37.0, 57.0, 103.0, 169.0, 315.0, 458.0, 830.0, 1378.0, 2333.0, 3888.0, 6692.0, 10742.0, 17758.0, 29311.0, 46079.0, 71009.0, 102248.0, 134077.0, 150610.0, 141282.0, 111604.0, 79406.0, 52601.0, 33245.0, 20572.0, 12616.0, 7840.0, 4604.0, 2712.0, 1662.0, 908.0, 573.0, 318.0, 187.0, 120.0, 49.0, 36.0, 20.0, 14.0, 11.0, 13.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.396484375, -3.2955322265625, -3.194580078125, -3.0936279296875, -2.99267578125, -2.8917236328125, -2.790771484375, -2.6898193359375, -2.5888671875, -2.4879150390625, -2.386962890625, -2.2860107421875, -2.18505859375, -2.0841064453125, -1.983154296875, -1.8822021484375, -1.78125, -1.6802978515625, -1.579345703125, -1.4783935546875, -1.37744140625, -1.2764892578125, -1.175537109375, -1.0745849609375, -0.9736328125, -0.8726806640625, -0.771728515625, -0.6707763671875, -0.56982421875, -0.4688720703125, -0.367919921875, -0.2669677734375, -0.166015625, -0.0650634765625, 0.035888671875, 0.1368408203125, 0.23779296875, 0.3387451171875, 0.439697265625, 0.5406494140625, 0.6416015625, 0.7425537109375, 0.843505859375, 0.9444580078125, 1.04541015625, 1.1463623046875, 1.247314453125, 1.3482666015625, 1.44921875, 1.5501708984375, 1.651123046875, 1.7520751953125, 1.85302734375, 1.9539794921875, 2.054931640625, 2.1558837890625, 2.2568359375, 2.3577880859375, 2.458740234375, 2.5596923828125, 2.66064453125, 2.7615966796875, 2.862548828125, 2.9635009765625, 3.064453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 17.0, 19.0, 18.0, 23.0, 37.0, 21.0, 36.0, 39.0, 30.0, 39.0, 33.0, 39.0, 40.0, 47.0, 49.0, 41.0, 45.0, 43.0, 38.0, 34.0, 44.0, 31.0, 33.0, 31.0, 29.0, 23.0, 22.0, 21.0, 15.0, 17.0, 8.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.71875, -21.06005859375, -20.4013671875, -19.74267578125, -19.083984375, -18.42529296875, -17.7666015625, -17.10791015625, -16.44921875, -15.79052734375, -15.1318359375, -14.47314453125, -13.814453125, -13.15576171875, -12.4970703125, -11.83837890625, -11.1796875, -10.52099609375, -9.8623046875, -9.20361328125, -8.544921875, -7.88623046875, -7.2275390625, -6.56884765625, -5.91015625, -5.25146484375, -4.5927734375, -3.93408203125, -3.275390625, -2.61669921875, -1.9580078125, -1.29931640625, -0.640625, 0.01806640625, 0.6767578125, 1.33544921875, 1.994140625, 2.65283203125, 3.3115234375, 3.97021484375, 4.62890625, 5.28759765625, 5.9462890625, 6.60498046875, 7.263671875, 7.92236328125, 8.5810546875, 9.23974609375, 9.8984375, 10.55712890625, 11.2158203125, 11.87451171875, 12.533203125, 13.19189453125, 13.8505859375, 14.50927734375, 15.16796875, 15.82666015625, 16.4853515625, 17.14404296875, 17.802734375, 18.46142578125, 19.1201171875, 19.77880859375, 20.4375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 18.0, 24.0, 47.0, 58.0, 84.0, 137.0, 197.0, 338.0, 493.0, 833.0, 1335.0, 2125.0, 3423.0, 5729.0, 9450.0, 16209.0, 31707.0, 295619.0, 597126.0, 38278.0, 18552.0, 10534.0, 6214.0, 3781.0, 2273.0, 1453.0, 898.0, 571.0, 388.0, 210.0, 131.0, 93.0, 68.0, 38.0, 33.0, 18.0, 17.0, 14.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -5.9974365234375, -5.776123046875, -5.5548095703125, -5.33349609375, -5.1121826171875, -4.890869140625, -4.6695556640625, -4.4482421875, -4.2269287109375, -4.005615234375, -3.7843017578125, -3.56298828125, -3.3416748046875, -3.120361328125, -2.8990478515625, -2.677734375, -2.4564208984375, -2.235107421875, -2.0137939453125, -1.79248046875, -1.5711669921875, -1.349853515625, -1.1285400390625, -0.9072265625, -0.6859130859375, -0.464599609375, -0.2432861328125, -0.02197265625, 0.1993408203125, 0.420654296875, 0.6419677734375, 0.86328125, 1.0845947265625, 1.305908203125, 1.5272216796875, 1.74853515625, 1.9698486328125, 2.191162109375, 2.4124755859375, 2.6337890625, 2.8551025390625, 3.076416015625, 3.2977294921875, 3.51904296875, 3.7403564453125, 3.961669921875, 4.1829833984375, 4.404296875, 4.6256103515625, 4.846923828125, 5.0682373046875, 5.28955078125, 5.5108642578125, 5.732177734375, 5.9534912109375, 6.1748046875, 6.3961181640625, 6.617431640625, 6.8387451171875, 7.06005859375, 7.2813720703125, 7.502685546875, 7.7239990234375, 7.9453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 12.0, 8.0, 8.0, 15.0, 12.0, 8.0, 21.0, 29.0, 28.0, 29.0, 45.0, 38.0, 38.0, 45.0, 33.0, 43.0, 53.0, 49.0, 47.0, 50.0, 42.0, 33.0, 27.0, 31.0, 30.0, 38.0, 30.0, 28.0, 24.0, 12.0, 22.0, 17.0, 10.0, 10.0, 3.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.4921875, -14.0631103515625, -13.634033203125, -13.2049560546875, -12.77587890625, -12.3468017578125, -11.917724609375, -11.4886474609375, -11.0595703125, -10.6304931640625, -10.201416015625, -9.7723388671875, -9.34326171875, -8.9141845703125, -8.485107421875, -8.0560302734375, -7.626953125, -7.1978759765625, -6.768798828125, -6.3397216796875, -5.91064453125, -5.4815673828125, -5.052490234375, -4.6234130859375, -4.1943359375, -3.7652587890625, -3.336181640625, -2.9071044921875, -2.47802734375, -2.0489501953125, -1.619873046875, -1.1907958984375, -0.76171875, -0.3326416015625, 0.096435546875, 0.5255126953125, 0.95458984375, 1.3836669921875, 1.812744140625, 2.2418212890625, 2.6708984375, 3.0999755859375, 3.529052734375, 3.9581298828125, 4.38720703125, 4.8162841796875, 5.245361328125, 5.6744384765625, 6.103515625, 6.5325927734375, 6.961669921875, 7.3907470703125, 7.81982421875, 8.2489013671875, 8.677978515625, 9.1070556640625, 9.5361328125, 9.9652099609375, 10.394287109375, 10.8233642578125, 11.25244140625, 11.6815185546875, 12.110595703125, 12.5396728515625, 12.96875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 11.0, 15.0, 16.0, 34.0, 37.0, 43.0, 62.0, 121.0, 147.0, 199.0, 280.0, 451.0, 616.0, 931.0, 1319.0, 1963.0, 3149.0, 4866.0, 7063.0, 11170.0, 17711.0, 29397.0, 320520.0, 562504.0, 32418.0, 18903.0, 11904.0, 7624.0, 4808.0, 3429.0, 2276.0, 1497.0, 942.0, 642.0, 468.0, 298.0, 198.0, 154.0, 110.0, 72.0, 50.0, 38.0, 17.0, 18.0, 17.0, 13.0, 5.0, 7.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.5634765625, -0.5464401245117188, -0.5294036865234375, -0.5123672485351562, -0.495330810546875, -0.47829437255859375, -0.4612579345703125, -0.44422149658203125, -0.42718505859375, -0.41014862060546875, -0.3931121826171875, -0.37607574462890625, -0.359039306640625, -0.34200286865234375, -0.3249664306640625, -0.30792999267578125, -0.2908935546875, -0.27385711669921875, -0.2568206787109375, -0.23978424072265625, -0.222747802734375, -0.20571136474609375, -0.1886749267578125, -0.17163848876953125, -0.15460205078125, -0.13756561279296875, -0.1205291748046875, -0.10349273681640625, -0.086456298828125, -0.06941986083984375, -0.0523834228515625, -0.03534698486328125, -0.018310546875, -0.00127410888671875, 0.0157623291015625, 0.03279876708984375, 0.049835205078125, 0.06687164306640625, 0.0839080810546875, 0.10094451904296875, 0.11798095703125, 0.13501739501953125, 0.1520538330078125, 0.16909027099609375, 0.186126708984375, 0.20316314697265625, 0.2201995849609375, 0.23723602294921875, 0.2542724609375, 0.27130889892578125, 0.2883453369140625, 0.30538177490234375, 0.322418212890625, 0.33945465087890625, 0.3564910888671875, 0.37352752685546875, 0.39056396484375, 0.40760040283203125, 0.4246368408203125, 0.44167327880859375, 0.458709716796875, 0.47574615478515625, 0.4927825927734375, 0.5098190307617188, 0.52685546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 6.0, 14.0, 15.0, 16.0, 26.0, 25.0, 30.0, 40.0, 27.0, 33.0, 43.0, 46.0, 47.0, 65.0, 53.0, 55.0, 53.0, 51.0, 35.0, 36.0, 33.0, 42.0, 31.0, 32.0, 27.0, 16.0, 19.0, 15.0, 13.0, 10.0, 8.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7337501049041748e-05, -1.6614794731140137e-05, -1.5892088413238525e-05, -1.5169382095336914e-05, -1.4446675777435303e-05, -1.3723969459533691e-05, -1.300126314163208e-05, -1.2278556823730469e-05, -1.1555850505828857e-05, -1.0833144187927246e-05, -1.0110437870025635e-05, -9.387731552124023e-06, -8.665025234222412e-06, -7.9423189163208e-06, -7.2196125984191895e-06, -6.496906280517578e-06, -5.774199962615967e-06, -5.0514936447143555e-06, -4.328787326812744e-06, -3.606081008911133e-06, -2.8833746910095215e-06, -2.16066837310791e-06, -1.4379620552062988e-06, -7.152557373046875e-07, 7.450580596923828e-09, 7.301568984985352e-07, 1.4528632164001465e-06, 2.175569534301758e-06, 2.898275852203369e-06, 3.6209821701049805e-06, 4.343688488006592e-06, 5.066394805908203e-06, 5.7891011238098145e-06, 6.511807441711426e-06, 7.234513759613037e-06, 7.957220077514648e-06, 8.67992639541626e-06, 9.402632713317871e-06, 1.0125339031219482e-05, 1.0848045349121094e-05, 1.1570751667022705e-05, 1.2293457984924316e-05, 1.3016164302825928e-05, 1.3738870620727539e-05, 1.446157693862915e-05, 1.5184283256530762e-05, 1.5906989574432373e-05, 1.6629695892333984e-05, 1.7352402210235596e-05, 1.8075108528137207e-05, 1.879781484603882e-05, 1.952052116394043e-05, 2.024322748184204e-05, 2.0965933799743652e-05, 2.1688640117645264e-05, 2.2411346435546875e-05, 2.3134052753448486e-05, 2.3856759071350098e-05, 2.457946538925171e-05, 2.530217170715332e-05, 2.602487802505493e-05, 2.6747584342956543e-05, 2.7470290660858154e-05, 2.8192996978759766e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 15.0, 21.0, 16.0, 54.0, 68.0, 98.0, 164.0, 245.0, 395.0, 657.0, 991.0, 1654.0, 2684.0, 4121.0, 6520.0, 10136.0, 16386.0, 25182.0, 39243.0, 60391.0, 89513.0, 125660.0, 155540.0, 151372.0, 118591.0, 83568.0, 55677.0, 36333.0, 23012.0, 14677.0, 9211.0, 6087.0, 3942.0, 2397.0, 1443.0, 940.0, 591.0, 366.0, 203.0, 148.0, 88.0, 47.0, 28.0, 21.0, 15.0, 13.0, 10.0, 1.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.56103515625, -0.5434494018554688, -0.5258636474609375, -0.5082778930664062, -0.490692138671875, -0.47310638427734375, -0.4555206298828125, -0.43793487548828125, -0.42034912109375, -0.40276336669921875, -0.3851776123046875, -0.36759185791015625, -0.350006103515625, -0.33242034912109375, -0.3148345947265625, -0.29724884033203125, -0.2796630859375, -0.26207733154296875, -0.2444915771484375, -0.22690582275390625, -0.209320068359375, -0.19173431396484375, -0.1741485595703125, -0.15656280517578125, -0.13897705078125, -0.12139129638671875, -0.1038055419921875, -0.08621978759765625, -0.068634033203125, -0.05104827880859375, -0.0334625244140625, -0.01587677001953125, 0.001708984375, 0.01929473876953125, 0.0368804931640625, 0.05446624755859375, 0.072052001953125, 0.08963775634765625, 0.1072235107421875, 0.12480926513671875, 0.14239501953125, 0.15998077392578125, 0.1775665283203125, 0.19515228271484375, 0.212738037109375, 0.23032379150390625, 0.2479095458984375, 0.26549530029296875, 0.2830810546875, 0.30066680908203125, 0.3182525634765625, 0.33583831787109375, 0.353424072265625, 0.37100982666015625, 0.3885955810546875, 0.40618133544921875, 0.42376708984375, 0.44135284423828125, 0.4589385986328125, 0.47652435302734375, 0.494110107421875, 0.5116958618164062, 0.5292816162109375, 0.5468673706054688, 0.564453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 7.0, 4.0, 7.0, 9.0, 13.0, 22.0, 12.0, 14.0, 29.0, 22.0, 39.0, 39.0, 57.0, 60.0, 56.0, 63.0, 78.0, 70.0, 46.0, 62.0, 38.0, 47.0, 34.0, 32.0, 24.0, 22.0, 19.0, 15.0, 13.0, 7.0, 4.0, 10.0, 3.0, 2.0, 4.0, 3.0, 9.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2327880859375, -0.22540283203125, -0.218017578125, -0.21063232421875, -0.2032470703125, -0.19586181640625, -0.1884765625, -0.18109130859375, -0.1737060546875, -0.16632080078125, -0.158935546875, -0.15155029296875, -0.1441650390625, -0.13677978515625, -0.12939453125, -0.12200927734375, -0.1146240234375, -0.10723876953125, -0.099853515625, -0.09246826171875, -0.0850830078125, -0.07769775390625, -0.0703125, -0.06292724609375, -0.0555419921875, -0.04815673828125, -0.040771484375, -0.03338623046875, -0.0260009765625, -0.01861572265625, -0.01123046875, -0.00384521484375, 0.0035400390625, 0.01092529296875, 0.018310546875, 0.02569580078125, 0.0330810546875, 0.04046630859375, 0.0478515625, 0.05523681640625, 0.0626220703125, 0.07000732421875, 0.077392578125, 0.08477783203125, 0.0921630859375, 0.09954833984375, 0.10693359375, 0.11431884765625, 0.1217041015625, 0.12908935546875, 0.136474609375, 0.14385986328125, 0.1512451171875, 0.15863037109375, 0.166015625, 0.17340087890625, 0.1807861328125, 0.18817138671875, 0.195556640625, 0.20294189453125, 0.2103271484375, 0.21771240234375, 0.22509765625, 0.23248291015625, 0.2398681640625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 5.0, 3.0, 11.0, 9.0, 14.0, 13.0, 21.0, 23.0, 22.0, 30.0, 32.0, 29.0, 38.0, 48.0, 40.0, 45.0, 39.0, 39.0, 35.0, 50.0, 33.0, 50.0, 43.0, 30.0, 37.0, 37.0, 33.0, 27.0, 18.0, 27.0, 25.0, 14.0, 17.0, 11.0, 7.0, 11.0, 5.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.92188262939453, -16.3713321685791, -15.820782661437988, -15.270232200622559, -14.719682693481445, -14.169132232666016, -13.618581771850586, -13.068031311035156, -12.517481803894043, -11.966931343078613, -11.4163818359375, -10.86583137512207, -10.31528091430664, -9.764731407165527, -9.214180946350098, -8.663631439208984, -8.113080978393555, -7.562530994415283, -7.011981010437012, -6.461430549621582, -5.9108805656433105, -5.360330581665039, -4.809780120849609, -4.259230136871338, -3.7086801528930664, -3.158130168914795, -2.6075799465179443, -2.0570297241210938, -1.5064797401428223, -0.9559297561645508, -0.4053795337677002, 0.1451706886291504, 0.6957187652587891, 1.24626886844635, 1.7968189716339111, 2.3473691940307617, 2.897919178009033, 3.4484691619873047, 3.9990193843841553, 4.549569606781006, 5.100119590759277, 5.650669574737549, 6.20121955871582, 6.75177001953125, 7.3023200035095215, 7.852869987487793, 8.403420448303223, 8.953969955444336, 9.504520416259766, 10.055070877075195, 10.605620384216309, 11.156170845031738, 11.706720352172852, 12.257270812988281, 12.807821273803711, 13.35837173461914, 13.908921241760254, 14.459471702575684, 15.010021209716797, 15.560571670532227, 16.111122131347656, 16.661670684814453, 17.212221145629883, 17.762771606445312, 18.313322067260742]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 7.0, 17.0, 19.0, 20.0, 20.0, 38.0, 21.0, 37.0, 38.0, 29.0, 41.0, 32.0, 41.0, 37.0, 43.0, 51.0, 44.0, 45.0, 40.0, 41.0, 34.0, 43.0, 32.0, 31.0, 32.0, 27.0, 24.0, 21.0, 22.0, 16.0, 16.0, 9.0, 6.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.68993377685547, -21.03296661376953, -20.375999450683594, -19.719032287597656, -19.06206512451172, -18.40509796142578, -17.748130798339844, -17.091163635253906, -16.43419647216797, -15.777229309082031, -15.120262145996094, -14.463294982910156, -13.806327819824219, -13.149360656738281, -12.492393493652344, -11.835426330566406, -11.178460121154785, -10.521492958068848, -9.86452579498291, -9.207558631896973, -8.550591468811035, -7.893624305725098, -7.236657619476318, -6.579690456390381, -5.922723293304443, -5.265756130218506, -4.608788967132568, -3.95182204246521, -3.2948548793792725, -2.637887716293335, -1.9809207916259766, -1.323953628540039, -0.6669864654541016, -0.010019361972808838, 0.6469477415084839, 1.3039147853851318, 1.9608819484710693, 2.617849111557007, 3.2748160362243652, 3.9317831993103027, 4.58875036239624, 5.245717525482178, 5.902684688568115, 6.5596513748168945, 7.216618537902832, 7.8735857009887695, 8.530552864074707, 9.187520027160645, 9.844487190246582, 10.50145435333252, 11.158421516418457, 11.815388679504395, 12.472355842590332, 13.12932300567627, 13.78628921508789, 14.443256378173828, 15.100223541259766, 15.757190704345703, 16.41415786743164, 17.071125030517578, 17.728092193603516, 18.385059356689453, 19.04202651977539, 19.698993682861328, 20.355960845947266]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 14.0, 23.0, 32.0, 55.0, 96.0, 152.0, 226.0, 340.0, 548.0, 1010.0, 1548.0, 2396.0, 3775.0, 5978.0, 9169.0, 13617.0, 19853.0, 28497.0, 38880.0, 52197.0, 66791.0, 80366.0, 91256.0, 97989.0, 97979.0, 93565.0, 82487.0, 68880.0, 54945.0, 41867.0, 30798.0, 21193.0, 14668.0, 9915.0, 6273.0, 4013.0, 2681.0, 1644.0, 1069.0, 672.0, 384.0, 257.0, 165.0, 118.0, 61.0, 36.0, 29.0, 17.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1015625, -11.71240234375, -11.3232421875, -10.93408203125, -10.544921875, -10.15576171875, -9.7666015625, -9.37744140625, -8.98828125, -8.59912109375, -8.2099609375, -7.82080078125, -7.431640625, -7.04248046875, -6.6533203125, -6.26416015625, -5.875, -5.48583984375, -5.0966796875, -4.70751953125, -4.318359375, -3.92919921875, -3.5400390625, -3.15087890625, -2.76171875, -2.37255859375, -1.9833984375, -1.59423828125, -1.205078125, -0.81591796875, -0.4267578125, -0.03759765625, 0.3515625, 0.74072265625, 1.1298828125, 1.51904296875, 1.908203125, 2.29736328125, 2.6865234375, 3.07568359375, 3.46484375, 3.85400390625, 4.2431640625, 4.63232421875, 5.021484375, 5.41064453125, 5.7998046875, 6.18896484375, 6.578125, 6.96728515625, 7.3564453125, 7.74560546875, 8.134765625, 8.52392578125, 8.9130859375, 9.30224609375, 9.69140625, 10.08056640625, 10.4697265625, 10.85888671875, 11.248046875, 11.63720703125, 12.0263671875, 12.41552734375, 12.8046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 12.0, 12.0, 21.0, 20.0, 20.0, 34.0, 23.0, 35.0, 43.0, 32.0, 38.0, 32.0, 38.0, 42.0, 44.0, 48.0, 47.0, 43.0, 39.0, 40.0, 35.0, 47.0, 29.0, 35.0, 32.0, 24.0, 23.0, 22.0, 22.0, 18.0, 12.0, 11.0, 5.0, 3.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.362548828125, -19.72509765625, -19.087646484375, -18.4501953125, -17.812744140625, -17.17529296875, -16.537841796875, -15.900390625, -15.262939453125, -14.62548828125, -13.988037109375, -13.3505859375, -12.713134765625, -12.07568359375, -11.438232421875, -10.80078125, -10.163330078125, -9.52587890625, -8.888427734375, -8.2509765625, -7.613525390625, -6.97607421875, -6.338623046875, -5.701171875, -5.063720703125, -4.42626953125, -3.788818359375, -3.1513671875, -2.513916015625, -1.87646484375, -1.239013671875, -0.6015625, 0.035888671875, 0.67333984375, 1.310791015625, 1.9482421875, 2.585693359375, 3.22314453125, 3.860595703125, 4.498046875, 5.135498046875, 5.77294921875, 6.410400390625, 7.0478515625, 7.685302734375, 8.32275390625, 8.960205078125, 9.59765625, 10.235107421875, 10.87255859375, 11.510009765625, 12.1474609375, 12.784912109375, 13.42236328125, 14.059814453125, 14.697265625, 15.334716796875, 15.97216796875, 16.609619140625, 17.2470703125, 17.884521484375, 18.52197265625, 19.159423828125, 19.796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 15.0, 21.0, 40.0, 59.0, 100.0, 170.0, 249.0, 410.0, 648.0, 1127.0, 1728.0, 2995.0, 4523.0, 7190.0, 11108.0, 16643.0, 24416.0, 34742.0, 47413.0, 62172.0, 77512.0, 91386.0, 99675.0, 102630.0, 98197.0, 87870.0, 73960.0, 59360.0, 44927.0, 31962.0, 22310.0, 15347.0, 10065.0, 6528.0, 4137.0, 2554.0, 1683.0, 1087.0, 644.0, 390.0, 219.0, 125.0, 87.0, 52.0, 23.0, 15.0, 14.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.955078125, -11.57421875, -11.193359375, -10.8125, -10.431640625, -10.05078125, -9.669921875, -9.2890625, -8.908203125, -8.52734375, -8.146484375, -7.765625, -7.384765625, -7.00390625, -6.623046875, -6.2421875, -5.861328125, -5.48046875, -5.099609375, -4.71875, -4.337890625, -3.95703125, -3.576171875, -3.1953125, -2.814453125, -2.43359375, -2.052734375, -1.671875, -1.291015625, -0.91015625, -0.529296875, -0.1484375, 0.232421875, 0.61328125, 0.994140625, 1.375, 1.755859375, 2.13671875, 2.517578125, 2.8984375, 3.279296875, 3.66015625, 4.041015625, 4.421875, 4.802734375, 5.18359375, 5.564453125, 5.9453125, 6.326171875, 6.70703125, 7.087890625, 7.46875, 7.849609375, 8.23046875, 8.611328125, 8.9921875, 9.373046875, 9.75390625, 10.134765625, 10.515625, 10.896484375, 11.27734375, 11.658203125, 12.0390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 11.0, 14.0, 15.0, 22.0, 22.0, 22.0, 27.0, 30.0, 32.0, 27.0, 37.0, 43.0, 31.0, 43.0, 49.0, 61.0, 41.0, 36.0, 48.0, 39.0, 37.0, 40.0, 36.0, 24.0, 26.0, 19.0, 27.0, 20.0, 23.0, 16.0, 16.0, 14.0, 10.0, 5.0, 5.0, 3.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -11.2449951171875, -10.849365234375, -10.4537353515625, -10.05810546875, -9.6624755859375, -9.266845703125, -8.8712158203125, -8.4755859375, -8.0799560546875, -7.684326171875, -7.2886962890625, -6.89306640625, -6.4974365234375, -6.101806640625, -5.7061767578125, -5.310546875, -4.9149169921875, -4.519287109375, -4.1236572265625, -3.72802734375, -3.3323974609375, -2.936767578125, -2.5411376953125, -2.1455078125, -1.7498779296875, -1.354248046875, -0.9586181640625, -0.56298828125, -0.1673583984375, 0.228271484375, 0.6239013671875, 1.01953125, 1.4151611328125, 1.810791015625, 2.2064208984375, 2.60205078125, 2.9976806640625, 3.393310546875, 3.7889404296875, 4.1845703125, 4.5802001953125, 4.975830078125, 5.3714599609375, 5.76708984375, 6.1627197265625, 6.558349609375, 6.9539794921875, 7.349609375, 7.7452392578125, 8.140869140625, 8.5364990234375, 8.93212890625, 9.3277587890625, 9.723388671875, 10.1190185546875, 10.5146484375, 10.9102783203125, 11.305908203125, 11.7015380859375, 12.09716796875, 12.4927978515625, 12.888427734375, 13.2840576171875, 13.6796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 10.0, 12.0, 20.0, 30.0, 41.0, 62.0, 111.0, 158.0, 321.0, 453.0, 734.0, 1183.0, 1794.0, 2908.0, 4596.0, 7214.0, 10940.0, 16250.0, 24170.0, 34507.0, 47299.0, 62390.0, 77281.0, 91070.0, 100103.0, 103260.0, 99180.0, 87970.0, 73811.0, 59192.0, 44631.0, 32052.0, 22460.0, 14857.0, 9792.0, 6512.0, 4107.0, 2694.0, 1612.0, 1073.0, 647.0, 387.0, 235.0, 162.0, 101.0, 71.0, 38.0, 25.0, 17.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.60906982421875, -4.4407958984375, -4.27252197265625, -4.104248046875, -3.93597412109375, -3.7677001953125, -3.59942626953125, -3.43115234375, -3.26287841796875, -3.0946044921875, -2.92633056640625, -2.758056640625, -2.58978271484375, -2.4215087890625, -2.25323486328125, -2.0849609375, -1.91668701171875, -1.7484130859375, -1.58013916015625, -1.411865234375, -1.24359130859375, -1.0753173828125, -0.90704345703125, -0.73876953125, -0.57049560546875, -0.4022216796875, -0.23394775390625, -0.065673828125, 0.10260009765625, 0.2708740234375, 0.43914794921875, 0.607421875, 0.77569580078125, 0.9439697265625, 1.11224365234375, 1.280517578125, 1.44879150390625, 1.6170654296875, 1.78533935546875, 1.95361328125, 2.12188720703125, 2.2901611328125, 2.45843505859375, 2.626708984375, 2.79498291015625, 2.9632568359375, 3.13153076171875, 3.2998046875, 3.46807861328125, 3.6363525390625, 3.80462646484375, 3.972900390625, 4.14117431640625, 4.3094482421875, 4.47772216796875, 4.64599609375, 4.81427001953125, 4.9825439453125, 5.15081787109375, 5.319091796875, 5.48736572265625, 5.6556396484375, 5.82391357421875, 5.9921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 9.0, 10.0, 10.0, 8.0, 8.0, 13.0, 9.0, 17.0, 21.0, 25.0, 25.0, 23.0, 33.0, 44.0, 33.0, 37.0, 33.0, 57.0, 49.0, 47.0, 42.0, 49.0, 47.0, 40.0, 43.0, 39.0, 32.0, 28.0, 31.0, 28.0, 20.0, 11.0, 18.0, 10.0, 11.0, 4.0, 8.0, 2.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00074005126953125, -0.0007163435220718384, -0.0006926357746124268, -0.0006689280271530151, -0.0006452202796936035, -0.0006215125322341919, -0.0005978047847747803, -0.0005740970373153687, -0.000550389289855957, -0.0005266815423965454, -0.0005029737949371338, -0.00047926604747772217, -0.00045555830001831055, -0.0004318505525588989, -0.0004081428050994873, -0.0003844350576400757, -0.00036072731018066406, -0.00033701956272125244, -0.0003133118152618408, -0.0002896040678024292, -0.0002658963203430176, -0.00024218857288360596, -0.00021848082542419434, -0.00019477307796478271, -0.0001710653305053711, -0.00014735758304595947, -0.00012364983558654785, -9.994208812713623e-05, -7.623434066772461e-05, -5.252659320831299e-05, -2.8818845748901367e-05, -5.111098289489746e-06, 1.8596649169921875e-05, 4.2304396629333496e-05, 6.601214408874512e-05, 8.971989154815674e-05, 0.00011342763900756836, 0.00013713538646697998, 0.0001608431339263916, 0.00018455088138580322, 0.00020825862884521484, 0.00023196637630462646, 0.0002556741237640381, 0.0002793818712234497, 0.00030308961868286133, 0.00032679736614227295, 0.00035050511360168457, 0.0003742128610610962, 0.0003979206085205078, 0.00042162835597991943, 0.00044533610343933105, 0.0004690438508987427, 0.0004927515983581543, 0.0005164593458175659, 0.0005401670932769775, 0.0005638748407363892, 0.0005875825881958008, 0.0006112903356552124, 0.000634998083114624, 0.0006587058305740356, 0.0006824135780334473, 0.0007061213254928589, 0.0007298290729522705, 0.0007535368204116821, 0.0007772445678710938]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 7.0, 6.0, 13.0, 25.0, 24.0, 42.0, 40.0, 84.0, 124.0, 197.0, 334.0, 478.0, 714.0, 1207.0, 1904.0, 3040.0, 4642.0, 7268.0, 10984.0, 16501.0, 24474.0, 34992.0, 47878.0, 62982.0, 78647.0, 92110.0, 101220.0, 103942.0, 98652.0, 87921.0, 73706.0, 57361.0, 43026.0, 30987.0, 21846.0, 14264.0, 9600.0, 6261.0, 4089.0, 2534.0, 1707.0, 1034.0, 618.0, 424.0, 226.0, 149.0, 101.0, 60.0, 37.0, 31.0, 21.0, 10.0, 11.0, 4.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.6458740234375, -5.459716796875, -5.2735595703125, -5.08740234375, -4.9012451171875, -4.715087890625, -4.5289306640625, -4.3427734375, -4.1566162109375, -3.970458984375, -3.7843017578125, -3.59814453125, -3.4119873046875, -3.225830078125, -3.0396728515625, -2.853515625, -2.6673583984375, -2.481201171875, -2.2950439453125, -2.10888671875, -1.9227294921875, -1.736572265625, -1.5504150390625, -1.3642578125, -1.1781005859375, -0.991943359375, -0.8057861328125, -0.61962890625, -0.4334716796875, -0.247314453125, -0.0611572265625, 0.125, 0.3111572265625, 0.497314453125, 0.6834716796875, 0.86962890625, 1.0557861328125, 1.241943359375, 1.4281005859375, 1.6142578125, 1.8004150390625, 1.986572265625, 2.1727294921875, 2.35888671875, 2.5450439453125, 2.731201171875, 2.9173583984375, 3.103515625, 3.2896728515625, 3.475830078125, 3.6619873046875, 3.84814453125, 4.0343017578125, 4.220458984375, 4.4066162109375, 4.5927734375, 4.7789306640625, 4.965087890625, 5.1512451171875, 5.33740234375, 5.5235595703125, 5.709716796875, 5.8958740234375, 6.08203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 9.0, 12.0, 8.0, 14.0, 21.0, 21.0, 30.0, 31.0, 42.0, 64.0, 41.0, 58.0, 69.0, 72.0, 55.0, 68.0, 60.0, 64.0, 45.0, 41.0, 36.0, 36.0, 20.0, 25.0, 16.0, 13.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.2105712890625, -4.089111328125, -3.9676513671875, -3.84619140625, -3.7247314453125, -3.603271484375, -3.4818115234375, -3.3603515625, -3.2388916015625, -3.117431640625, -2.9959716796875, -2.87451171875, -2.7530517578125, -2.631591796875, -2.5101318359375, -2.388671875, -2.2672119140625, -2.145751953125, -2.0242919921875, -1.90283203125, -1.7813720703125, -1.659912109375, -1.5384521484375, -1.4169921875, -1.2955322265625, -1.174072265625, -1.0526123046875, -0.93115234375, -0.8096923828125, -0.688232421875, -0.5667724609375, -0.4453125, -0.3238525390625, -0.202392578125, -0.0809326171875, 0.04052734375, 0.1619873046875, 0.283447265625, 0.4049072265625, 0.5263671875, 0.6478271484375, 0.769287109375, 0.8907470703125, 1.01220703125, 1.1336669921875, 1.255126953125, 1.3765869140625, 1.498046875, 1.6195068359375, 1.740966796875, 1.8624267578125, 1.98388671875, 2.1053466796875, 2.226806640625, 2.3482666015625, 2.4697265625, 2.5911865234375, 2.712646484375, 2.8341064453125, 2.95556640625, 3.0770263671875, 3.198486328125, 3.3199462890625, 3.44140625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 2.0, 5.0, 6.0, 8.0, 12.0, 14.0, 15.0, 21.0, 12.0, 27.0, 25.0, 27.0, 31.0, 41.0, 35.0, 31.0, 33.0, 43.0, 48.0, 34.0, 46.0, 35.0, 39.0, 35.0, 38.0, 42.0, 32.0, 33.0, 29.0, 25.0, 22.0, 26.0, 17.0, 13.0, 10.0, 23.0, 16.0, 9.0, 7.0, 7.0, 7.0, 5.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4219970703125, -14.90878677368164, -14.395577430725098, -13.882367134094238, -13.369157791137695, -12.855947494506836, -12.342737197875977, -11.829526901245117, -11.316317558288574, -10.803107261657715, -10.289897918701172, -9.776687622070312, -9.263477325439453, -8.75026798248291, -8.23705768585205, -7.72384786605835, -7.210638046264648, -6.697428226470947, -6.184218406677246, -5.671008110046387, -5.1577982902526855, -4.644588470458984, -4.131378173828125, -3.618168354034424, -3.1049585342407227, -2.5917487144470215, -2.078538656234741, -1.5653287172317505, -1.0521187782287598, -0.5389089584350586, -0.02569890022277832, 0.48751115798950195, 1.0007190704345703, 1.513929009437561, 2.0271389484405518, 2.540349006652832, 3.053558826446533, 3.5667686462402344, 4.079978942871094, 4.593188762664795, 5.106398582458496, 5.619608402252197, 6.132818222045898, 6.646028518676758, 7.159238338470459, 7.67244815826416, 8.18565845489502, 8.698867797851562, 9.212078094482422, 9.725288391113281, 10.238497734069824, 10.751708030700684, 11.264917373657227, 11.778127670288086, 12.291337966918945, 12.804548263549805, 13.317757606506348, 13.830967903137207, 14.34417724609375, 14.85738754272461, 15.370597839355469, 15.883807182312012, 16.397016525268555, 16.910226821899414, 17.423437118530273]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 9.0, 13.0, 14.0, 17.0, 25.0, 22.0, 25.0, 24.0, 28.0, 30.0, 42.0, 33.0, 32.0, 29.0, 43.0, 53.0, 35.0, 41.0, 41.0, 41.0, 44.0, 40.0, 42.0, 23.0, 35.0, 22.0, 32.0, 33.0, 22.0, 24.0, 12.0, 10.0, 13.0, 14.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.436277389526367, -20.79283332824707, -20.149389266967773, -19.505943298339844, -18.862499237060547, -18.21905517578125, -17.575611114501953, -16.932167053222656, -16.28872299194336, -15.645278930664062, -15.00183391571045, -14.358389854431152, -13.714944839477539, -13.071500778198242, -12.428056716918945, -11.784612655639648, -11.141166687011719, -10.497722625732422, -9.854277610778809, -9.210833549499512, -8.567388534545898, -7.923944473266602, -7.280500411987305, -6.63705587387085, -5.9936113357543945, -5.3501667976379395, -4.706722259521484, -4.0632781982421875, -3.4198336601257324, -2.7763891220092773, -2.1329448223114014, -1.4895005226135254, -0.8460559844970703, -0.20261156558990479, 0.44083285331726074, 1.0842772722244263, 1.7277216911315918, 2.371166229248047, 3.014610528945923, 3.658054828643799, 4.301499366760254, 4.944943904876709, 5.588388442993164, 6.231832504272461, 6.875277042388916, 7.518721580505371, 8.162165641784668, 8.805610656738281, 9.449054718017578, 10.092498779296875, 10.735943794250488, 11.379387855529785, 12.022832870483398, 12.666276931762695, 13.309720993041992, 13.953165054321289, 14.596610069274902, 15.2400541305542, 15.883499145507812, 16.52694320678711, 17.170387268066406, 17.813831329345703, 18.457277297973633, 19.10072135925293, 19.744165420532227]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 6.0, 11.0, 22.0, 45.0, 61.0, 92.0, 125.0, 198.0, 342.0, 559.0, 981.0, 1673.0, 3041.0, 5272.0, 9436.0, 17040.0, 30958.0, 54510.0, 96254.0, 162769.0, 262390.0, 389506.0, 517816.0, 595921.0, 587387.0, 496229.0, 365946.0, 242342.0, 149431.0, 87441.0, 50190.0, 28201.0, 16191.0, 9286.0, 5233.0, 3001.0, 1757.0, 1040.0, 609.0, 356.0, 216.0, 122.0, 99.0, 55.0, 36.0, 29.0, 21.0, 6.0, 11.0, 6.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-16.1875, -15.646484375, -15.10546875, -14.564453125, -14.0234375, -13.482421875, -12.94140625, -12.400390625, -11.859375, -11.318359375, -10.77734375, -10.236328125, -9.6953125, -9.154296875, -8.61328125, -8.072265625, -7.53125, -6.990234375, -6.44921875, -5.908203125, -5.3671875, -4.826171875, -4.28515625, -3.744140625, -3.203125, -2.662109375, -2.12109375, -1.580078125, -1.0390625, -0.498046875, 0.04296875, 0.583984375, 1.125, 1.666015625, 2.20703125, 2.748046875, 3.2890625, 3.830078125, 4.37109375, 4.912109375, 5.453125, 5.994140625, 6.53515625, 7.076171875, 7.6171875, 8.158203125, 8.69921875, 9.240234375, 9.78125, 10.322265625, 10.86328125, 11.404296875, 11.9453125, 12.486328125, 13.02734375, 13.568359375, 14.109375, 14.650390625, 15.19140625, 15.732421875, 16.2734375, 16.814453125, 17.35546875, 17.896484375, 18.4375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 7.0, 11.0, 12.0, 16.0, 14.0, 26.0, 21.0, 25.0, 26.0, 25.0, 36.0, 33.0, 34.0, 31.0, 34.0, 43.0, 49.0, 37.0, 43.0, 40.0, 42.0, 42.0, 38.0, 41.0, 25.0, 30.0, 28.0, 27.0, 37.0, 25.0, 22.0, 10.0, 12.0, 13.0, 11.0, 7.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.53125, -19.914794921875, -19.29833984375, -18.681884765625, -18.0654296875, -17.448974609375, -16.83251953125, -16.216064453125, -15.599609375, -14.983154296875, -14.36669921875, -13.750244140625, -13.1337890625, -12.517333984375, -11.90087890625, -11.284423828125, -10.66796875, -10.051513671875, -9.43505859375, -8.818603515625, -8.2021484375, -7.585693359375, -6.96923828125, -6.352783203125, -5.736328125, -5.119873046875, -4.50341796875, -3.886962890625, -3.2705078125, -2.654052734375, -2.03759765625, -1.421142578125, -0.8046875, -0.188232421875, 0.42822265625, 1.044677734375, 1.6611328125, 2.277587890625, 2.89404296875, 3.510498046875, 4.126953125, 4.743408203125, 5.35986328125, 5.976318359375, 6.5927734375, 7.209228515625, 7.82568359375, 8.442138671875, 9.05859375, 9.675048828125, 10.29150390625, 10.907958984375, 11.5244140625, 12.140869140625, 12.75732421875, 13.373779296875, 13.990234375, 14.606689453125, 15.22314453125, 15.839599609375, 16.4560546875, 17.072509765625, 17.68896484375, 18.305419921875, 18.921875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 13.0, 3.0, 8.0, 23.0, 22.0, 57.0, 83.0, 145.0, 197.0, 314.0, 557.0, 833.0, 1429.0, 2373.0, 4040.0, 7020.0, 11800.0, 20326.0, 34082.0, 56699.0, 91825.0, 145176.0, 218497.0, 308582.0, 405191.0, 480023.0, 514580.0, 491176.0, 422178.0, 328311.0, 235137.0, 157857.0, 100700.0, 62319.0, 37673.0, 22568.0, 13219.0, 7820.0, 4620.0, 2684.0, 1648.0, 986.0, 562.0, 358.0, 229.0, 127.0, 85.0, 49.0, 41.0, 23.0, 8.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.015625, -16.49365234375, -15.9716796875, -15.44970703125, -14.927734375, -14.40576171875, -13.8837890625, -13.36181640625, -12.83984375, -12.31787109375, -11.7958984375, -11.27392578125, -10.751953125, -10.22998046875, -9.7080078125, -9.18603515625, -8.6640625, -8.14208984375, -7.6201171875, -7.09814453125, -6.576171875, -6.05419921875, -5.5322265625, -5.01025390625, -4.48828125, -3.96630859375, -3.4443359375, -2.92236328125, -2.400390625, -1.87841796875, -1.3564453125, -0.83447265625, -0.3125, 0.20947265625, 0.7314453125, 1.25341796875, 1.775390625, 2.29736328125, 2.8193359375, 3.34130859375, 3.86328125, 4.38525390625, 4.9072265625, 5.42919921875, 5.951171875, 6.47314453125, 6.9951171875, 7.51708984375, 8.0390625, 8.56103515625, 9.0830078125, 9.60498046875, 10.126953125, 10.64892578125, 11.1708984375, 11.69287109375, 12.21484375, 12.73681640625, 13.2587890625, 13.78076171875, 14.302734375, 14.82470703125, 15.3466796875, 15.86865234375, 16.390625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 7.0, 18.0, 18.0, 23.0, 33.0, 35.0, 55.0, 57.0, 64.0, 89.0, 91.0, 106.0, 117.0, 152.0, 138.0, 154.0, 191.0, 183.0, 210.0, 207.0, 190.0, 206.0, 197.0, 155.0, 194.0, 193.0, 141.0, 166.0, 114.0, 102.0, 89.0, 70.0, 53.0, 45.0, 39.0, 35.0, 28.0, 23.0, 16.0, 15.0, 10.0, 11.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-8.828125, -8.57293701171875, -8.3177490234375, -8.06256103515625, -7.807373046875, -7.55218505859375, -7.2969970703125, -7.04180908203125, -6.78662109375, -6.53143310546875, -6.2762451171875, -6.02105712890625, -5.765869140625, -5.51068115234375, -5.2554931640625, -5.00030517578125, -4.7451171875, -4.48992919921875, -4.2347412109375, -3.97955322265625, -3.724365234375, -3.46917724609375, -3.2139892578125, -2.95880126953125, -2.70361328125, -2.44842529296875, -2.1932373046875, -1.93804931640625, -1.682861328125, -1.42767333984375, -1.1724853515625, -0.91729736328125, -0.662109375, -0.40692138671875, -0.1517333984375, 0.10345458984375, 0.358642578125, 0.61383056640625, 0.8690185546875, 1.12420654296875, 1.37939453125, 1.63458251953125, 1.8897705078125, 2.14495849609375, 2.400146484375, 2.65533447265625, 2.9105224609375, 3.16571044921875, 3.4208984375, 3.67608642578125, 3.9312744140625, 4.18646240234375, 4.441650390625, 4.69683837890625, 4.9520263671875, 5.20721435546875, 5.46240234375, 5.71759033203125, 5.9727783203125, 6.22796630859375, 6.483154296875, 6.73834228515625, 6.9935302734375, 7.24871826171875, 7.50390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 6.0, 9.0, 5.0, 14.0, 19.0, 17.0, 23.0, 17.0, 24.0, 18.0, 28.0, 27.0, 27.0, 31.0, 43.0, 34.0, 43.0, 30.0, 39.0, 40.0, 49.0, 41.0, 40.0, 45.0, 37.0, 30.0, 29.0, 33.0, 30.0, 28.0, 19.0, 22.0, 16.0, 9.0, 10.0, 9.0, 8.0, 10.0, 9.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.20712661743164, -16.641019821166992, -16.074913024902344, -15.508807182312012, -14.94270133972168, -14.376594543457031, -13.810487747192383, -13.244380950927734, -12.678275108337402, -12.112168312072754, -11.546062469482422, -10.979955673217773, -10.413848876953125, -9.847743034362793, -9.281636238098145, -8.715530395507812, -8.149423599243164, -7.583317279815674, -7.017210960388184, -6.451104164123535, -5.884997844696045, -5.318891525268555, -4.752784729003906, -4.186678409576416, -3.620572090148926, -3.0544657707214355, -2.488359212875366, -1.9222527742385864, -1.3561463356018066, -0.7900400161743164, -0.22393345832824707, 0.34217309951782227, 0.9082794189453125, 1.4743858575820923, 2.040492296218872, 2.6065988540649414, 3.1727051734924316, 3.738811492919922, 4.30491828918457, 4.8710246086120605, 5.437130928039551, 6.003237247467041, 6.569343566894531, 7.13545036315918, 7.70155668258667, 8.26766300201416, 8.833769798278809, 9.39987564086914, 9.965982437133789, 10.532089233398438, 11.09819507598877, 11.664301872253418, 12.23040771484375, 12.796514511108398, 13.362621307373047, 13.928728103637695, 14.494833946228027, 15.060940742492676, 15.627046585083008, 16.193153381347656, 16.759260177612305, 17.325366973876953, 17.89147186279297, 18.457578659057617, 19.023685455322266]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 11.0, 15.0, 14.0, 17.0, 20.0, 25.0, 19.0, 19.0, 26.0, 36.0, 29.0, 27.0, 32.0, 28.0, 53.0, 54.0, 41.0, 43.0, 42.0, 30.0, 34.0, 42.0, 39.0, 35.0, 31.0, 39.0, 31.0, 35.0, 27.0, 10.0, 15.0, 15.0, 8.0, 17.0, 6.0, 7.0, 12.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.807043075561523, -20.106842041015625, -19.406641006469727, -18.706439971923828, -18.006237030029297, -17.3060359954834, -16.6058349609375, -15.905633926391602, -15.205431938171387, -14.505230903625488, -13.805028915405273, -13.104827880859375, -12.404626846313477, -11.704424858093262, -11.004223823547363, -10.304021835327148, -9.60382080078125, -8.903619766235352, -8.203417778015137, -7.503216743469238, -6.803015232086182, -6.102813720703125, -5.402612686157227, -4.70241117477417, -4.002209663391113, -3.3020081520080566, -2.601806879043579, -1.9016056060791016, -1.201404094696045, -0.5012025833129883, 0.19899845123291016, 0.8991999626159668, 1.5994014739990234, 2.29960298538208, 2.9998042583465576, 3.700005531311035, 4.400207042694092, 5.100408554077148, 5.800609588623047, 6.5008111000061035, 7.20101261138916, 7.901214122772217, 8.601415634155273, 9.301616668701172, 10.00181770324707, 10.702019691467285, 11.402220726013184, 12.102422714233398, 12.802623748779297, 13.502824783325195, 14.20302677154541, 14.903227806091309, 15.603429794311523, 16.303630828857422, 17.00383186340332, 17.70403289794922, 18.40423583984375, 19.10443687438965, 19.804637908935547, 20.504840850830078, 21.205041885375977, 21.905242919921875, 22.605443954467773, 23.305644989013672, 24.00584602355957]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 11.0, 13.0, 16.0, 29.0, 46.0, 61.0, 144.0, 138.0, 275.0, 477.0, 676.0, 1151.0, 1905.0, 2937.0, 4686.0, 7504.0, 12225.0, 19777.0, 31052.0, 49292.0, 74998.0, 108021.0, 138145.0, 150413.0, 136343.0, 105495.0, 73734.0, 48176.0, 30477.0, 19148.0, 11694.0, 7244.0, 4490.0, 2835.0, 1758.0, 1080.0, 765.0, 465.0, 311.0, 177.0, 126.0, 80.0, 50.0, 43.0, 32.0, 14.0, 9.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.2890625, -4.160919189453125, -4.03277587890625, -3.904632568359375, -3.7764892578125, -3.648345947265625, -3.52020263671875, -3.392059326171875, -3.263916015625, -3.135772705078125, -3.00762939453125, -2.879486083984375, -2.7513427734375, -2.623199462890625, -2.49505615234375, -2.366912841796875, -2.23876953125, -2.110626220703125, -1.98248291015625, -1.854339599609375, -1.7261962890625, -1.598052978515625, -1.46990966796875, -1.341766357421875, -1.213623046875, -1.085479736328125, -0.95733642578125, -0.829193115234375, -0.7010498046875, -0.572906494140625, -0.44476318359375, -0.316619873046875, -0.1884765625, -0.060333251953125, 0.06781005859375, 0.195953369140625, 0.3240966796875, 0.452239990234375, 0.58038330078125, 0.708526611328125, 0.836669921875, 0.964813232421875, 1.09295654296875, 1.221099853515625, 1.3492431640625, 1.477386474609375, 1.60552978515625, 1.733673095703125, 1.86181640625, 1.989959716796875, 2.11810302734375, 2.246246337890625, 2.3743896484375, 2.502532958984375, 2.63067626953125, 2.758819580078125, 2.886962890625, 3.015106201171875, 3.14324951171875, 3.271392822265625, 3.3995361328125, 3.527679443359375, 3.65582275390625, 3.783966064453125, 3.912109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 5.0, 14.0, 13.0, 18.0, 14.0, 22.0, 21.0, 20.0, 19.0, 27.0, 38.0, 28.0, 27.0, 34.0, 25.0, 55.0, 53.0, 46.0, 41.0, 39.0, 33.0, 32.0, 44.0, 34.0, 38.0, 31.0, 38.0, 29.0, 36.0, 27.0, 10.0, 15.0, 14.0, 7.0, 19.0, 4.0, 8.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.921875, -20.218994140625, -19.51611328125, -18.813232421875, -18.1103515625, -17.407470703125, -16.70458984375, -16.001708984375, -15.298828125, -14.595947265625, -13.89306640625, -13.190185546875, -12.4873046875, -11.784423828125, -11.08154296875, -10.378662109375, -9.67578125, -8.972900390625, -8.27001953125, -7.567138671875, -6.8642578125, -6.161376953125, -5.45849609375, -4.755615234375, -4.052734375, -3.349853515625, -2.64697265625, -1.944091796875, -1.2412109375, -0.538330078125, 0.16455078125, 0.867431640625, 1.5703125, 2.273193359375, 2.97607421875, 3.678955078125, 4.3818359375, 5.084716796875, 5.78759765625, 6.490478515625, 7.193359375, 7.896240234375, 8.59912109375, 9.302001953125, 10.0048828125, 10.707763671875, 11.41064453125, 12.113525390625, 12.81640625, 13.519287109375, 14.22216796875, 14.925048828125, 15.6279296875, 16.330810546875, 17.03369140625, 17.736572265625, 18.439453125, 19.142333984375, 19.84521484375, 20.548095703125, 21.2509765625, 21.953857421875, 22.65673828125, 23.359619140625, 24.0625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 13.0, 12.0, 25.0, 35.0, 49.0, 68.0, 115.0, 171.0, 246.0, 421.0, 684.0, 1209.0, 1959.0, 3392.0, 5883.0, 10292.0, 18899.0, 41664.0, 765946.0, 138174.0, 26777.0, 13933.0, 7670.0, 4351.0, 2576.0, 1515.0, 922.0, 572.0, 328.0, 237.0, 136.0, 92.0, 52.0, 35.0, 36.0, 16.0, 11.0, 16.0, 10.0, 2.0, 1.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6171875, -9.3143310546875, -9.011474609375, -8.7086181640625, -8.40576171875, -8.1029052734375, -7.800048828125, -7.4971923828125, -7.1943359375, -6.8914794921875, -6.588623046875, -6.2857666015625, -5.98291015625, -5.6800537109375, -5.377197265625, -5.0743408203125, -4.771484375, -4.4686279296875, -4.165771484375, -3.8629150390625, -3.56005859375, -3.2572021484375, -2.954345703125, -2.6514892578125, -2.3486328125, -2.0457763671875, -1.742919921875, -1.4400634765625, -1.13720703125, -0.8343505859375, -0.531494140625, -0.2286376953125, 0.07421875, 0.3770751953125, 0.679931640625, 0.9827880859375, 1.28564453125, 1.5885009765625, 1.891357421875, 2.1942138671875, 2.4970703125, 2.7999267578125, 3.102783203125, 3.4056396484375, 3.70849609375, 4.0113525390625, 4.314208984375, 4.6170654296875, 4.919921875, 5.2227783203125, 5.525634765625, 5.8284912109375, 6.13134765625, 6.4342041015625, 6.737060546875, 7.0399169921875, 7.3427734375, 7.6456298828125, 7.948486328125, 8.2513427734375, 8.55419921875, 8.8570556640625, 9.159912109375, 9.4627685546875, 9.765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 9.0, 12.0, 7.0, 13.0, 11.0, 22.0, 16.0, 24.0, 22.0, 29.0, 23.0, 38.0, 37.0, 36.0, 40.0, 31.0, 54.0, 47.0, 48.0, 46.0, 38.0, 34.0, 42.0, 36.0, 39.0, 22.0, 26.0, 34.0, 29.0, 18.0, 26.0, 19.0, 18.0, 14.0, 8.0, 13.0, 4.0, 2.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2265625, -11.7576904296875, -11.288818359375, -10.8199462890625, -10.35107421875, -9.8822021484375, -9.413330078125, -8.9444580078125, -8.4755859375, -8.0067138671875, -7.537841796875, -7.0689697265625, -6.60009765625, -6.1312255859375, -5.662353515625, -5.1934814453125, -4.724609375, -4.2557373046875, -3.786865234375, -3.3179931640625, -2.84912109375, -2.3802490234375, -1.911376953125, -1.4425048828125, -0.9736328125, -0.5047607421875, -0.035888671875, 0.4329833984375, 0.90185546875, 1.3707275390625, 1.839599609375, 2.3084716796875, 2.77734375, 3.2462158203125, 3.715087890625, 4.1839599609375, 4.65283203125, 5.1217041015625, 5.590576171875, 6.0594482421875, 6.5283203125, 6.9971923828125, 7.466064453125, 7.9349365234375, 8.40380859375, 8.8726806640625, 9.341552734375, 9.8104248046875, 10.279296875, 10.7481689453125, 11.217041015625, 11.6859130859375, 12.15478515625, 12.6236572265625, 13.092529296875, 13.5614013671875, 14.0302734375, 14.4991455078125, 14.968017578125, 15.4368896484375, 15.90576171875, 16.3746337890625, 16.843505859375, 17.3123779296875, 17.78125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 11.0, 5.0, 9.0, 24.0, 18.0, 38.0, 44.0, 53.0, 82.0, 123.0, 155.0, 231.0, 307.0, 537.0, 713.0, 1134.0, 1753.0, 2678.0, 4029.0, 6191.0, 9914.0, 15974.0, 25998.0, 103052.0, 775691.0, 41311.0, 21390.0, 13177.0, 8392.0, 5311.0, 3530.0, 2272.0, 1465.0, 950.0, 598.0, 434.0, 290.0, 203.0, 138.0, 90.0, 55.0, 60.0, 21.0, 23.0, 25.0, 14.0, 10.0, 7.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6513671875, -0.6312103271484375, -0.611053466796875, -0.5908966064453125, -0.57073974609375, -0.5505828857421875, -0.530426025390625, -0.5102691650390625, -0.4901123046875, -0.4699554443359375, -0.449798583984375, -0.4296417236328125, -0.40948486328125, -0.3893280029296875, -0.369171142578125, -0.3490142822265625, -0.328857421875, -0.3087005615234375, -0.288543701171875, -0.2683868408203125, -0.24822998046875, -0.2280731201171875, -0.207916259765625, -0.1877593994140625, -0.1676025390625, -0.1474456787109375, -0.127288818359375, -0.1071319580078125, -0.08697509765625, -0.0668182373046875, -0.046661376953125, -0.0265045166015625, -0.00634765625, 0.0138092041015625, 0.033966064453125, 0.0541229248046875, 0.07427978515625, 0.0944366455078125, 0.114593505859375, 0.1347503662109375, 0.1549072265625, 0.1750640869140625, 0.195220947265625, 0.2153778076171875, 0.23553466796875, 0.2556915283203125, 0.275848388671875, 0.2960052490234375, 0.316162109375, 0.3363189697265625, 0.356475830078125, 0.3766326904296875, 0.39678955078125, 0.4169464111328125, 0.437103271484375, 0.4572601318359375, 0.4774169921875, 0.4975738525390625, 0.517730712890625, 0.5378875732421875, 0.55804443359375, 0.5782012939453125, 0.598358154296875, 0.6185150146484375, 0.638671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 8.0, 6.0, 8.0, 28.0, 28.0, 30.0, 23.0, 38.0, 37.0, 28.0, 52.0, 45.0, 51.0, 59.0, 47.0, 49.0, 58.0, 48.0, 52.0, 51.0, 29.0, 39.0, 35.0, 29.0, 24.0, 17.0, 14.0, 16.0, 12.0, 5.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.0219554901123047e-05, -2.932269126176834e-05, -2.8425827622413635e-05, -2.752896398305893e-05, -2.6632100343704224e-05, -2.5735236704349518e-05, -2.4838373064994812e-05, -2.3941509425640106e-05, -2.30446457862854e-05, -2.2147782146930695e-05, -2.125091850757599e-05, -2.0354054868221283e-05, -1.9457191228866577e-05, -1.856032758951187e-05, -1.7663463950157166e-05, -1.676660031080246e-05, -1.5869736671447754e-05, -1.4972873032093048e-05, -1.4076009392738342e-05, -1.3179145753383636e-05, -1.228228211402893e-05, -1.1385418474674225e-05, -1.0488554835319519e-05, -9.591691195964813e-06, -8.694827556610107e-06, -7.797963917255402e-06, -6.901100277900696e-06, -6.00423663854599e-06, -5.107372999191284e-06, -4.210509359836578e-06, -3.3136457204818726e-06, -2.4167820811271667e-06, -1.519918441772461e-06, -6.230548024177551e-07, 2.738088369369507e-07, 1.1706724762916565e-06, 2.0675361156463623e-06, 2.964399755001068e-06, 3.861263394355774e-06, 4.75812703371048e-06, 5.6549906730651855e-06, 6.551854312419891e-06, 7.448717951774597e-06, 8.345581591129303e-06, 9.242445230484009e-06, 1.0139308869838715e-05, 1.103617250919342e-05, 1.1933036148548126e-05, 1.2829899787902832e-05, 1.3726763427257538e-05, 1.4623627066612244e-05, 1.552049070596695e-05, 1.6417354345321655e-05, 1.731421798467636e-05, 1.8211081624031067e-05, 1.9107945263385773e-05, 2.000480890274048e-05, 2.0901672542095184e-05, 2.179853618144989e-05, 2.2695399820804596e-05, 2.3592263460159302e-05, 2.4489127099514008e-05, 2.5385990738868713e-05, 2.628285437822342e-05, 2.7179718017578125e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 6.0, 13.0, 12.0, 20.0, 40.0, 40.0, 78.0, 94.0, 150.0, 273.0, 384.0, 575.0, 968.0, 1489.0, 2215.0, 3426.0, 5435.0, 8790.0, 13571.0, 21474.0, 33863.0, 51044.0, 76645.0, 108109.0, 139964.0, 152411.0, 132421.0, 98713.0, 68310.0, 45486.0, 29976.0, 19183.0, 12142.0, 7720.0, 4847.0, 3095.0, 1947.0, 1256.0, 821.0, 539.0, 361.0, 200.0, 152.0, 91.0, 69.0, 45.0, 37.0, 18.0, 18.0, 8.0, 3.0, 3.0, 6.0, 3.0, 0.0, 1.0], "bins": [-0.5859375, -0.5683746337890625, -0.550811767578125, -0.5332489013671875, -0.51568603515625, -0.4981231689453125, -0.480560302734375, -0.4629974365234375, -0.4454345703125, -0.4278717041015625, -0.410308837890625, -0.3927459716796875, -0.37518310546875, -0.3576202392578125, -0.340057373046875, -0.3224945068359375, -0.304931640625, -0.2873687744140625, -0.269805908203125, -0.2522430419921875, -0.23468017578125, -0.2171173095703125, -0.199554443359375, -0.1819915771484375, -0.1644287109375, -0.1468658447265625, -0.129302978515625, -0.1117401123046875, -0.09417724609375, -0.0766143798828125, -0.059051513671875, -0.0414886474609375, -0.02392578125, -0.0063629150390625, 0.011199951171875, 0.0287628173828125, 0.04632568359375, 0.0638885498046875, 0.081451416015625, 0.0990142822265625, 0.1165771484375, 0.1341400146484375, 0.151702880859375, 0.1692657470703125, 0.18682861328125, 0.2043914794921875, 0.221954345703125, 0.2395172119140625, 0.257080078125, 0.2746429443359375, 0.292205810546875, 0.3097686767578125, 0.32733154296875, 0.3448944091796875, 0.362457275390625, 0.3800201416015625, 0.3975830078125, 0.4151458740234375, 0.432708740234375, 0.4502716064453125, 0.46783447265625, 0.4853973388671875, 0.502960205078125, 0.5205230712890625, 0.5380859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 4.0, 7.0, 8.0, 10.0, 15.0, 13.0, 15.0, 22.0, 33.0, 26.0, 27.0, 49.0, 40.0, 60.0, 52.0, 33.0, 66.0, 51.0, 55.0, 57.0, 46.0, 53.0, 40.0, 29.0, 32.0, 30.0, 31.0, 26.0, 15.0, 16.0, 14.0, 11.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260009765625, -0.25142669677734375, -0.2428436279296875, -0.23426055908203125, -0.225677490234375, -0.21709442138671875, -0.2085113525390625, -0.19992828369140625, -0.19134521484375, -0.18276214599609375, -0.1741790771484375, -0.16559600830078125, -0.157012939453125, -0.14842987060546875, -0.1398468017578125, -0.13126373291015625, -0.1226806640625, -0.11409759521484375, -0.1055145263671875, -0.09693145751953125, -0.088348388671875, -0.07976531982421875, -0.0711822509765625, -0.06259918212890625, -0.05401611328125, -0.04543304443359375, -0.0368499755859375, -0.02826690673828125, -0.019683837890625, -0.01110076904296875, -0.0025177001953125, 0.00606536865234375, 0.0146484375, 0.02323150634765625, 0.0318145751953125, 0.04039764404296875, 0.048980712890625, 0.05756378173828125, 0.0661468505859375, 0.07472991943359375, 0.08331298828125, 0.09189605712890625, 0.1004791259765625, 0.10906219482421875, 0.117645263671875, 0.12622833251953125, 0.1348114013671875, 0.14339447021484375, 0.1519775390625, 0.16056060791015625, 0.1691436767578125, 0.17772674560546875, 0.186309814453125, 0.19489288330078125, 0.2034759521484375, 0.21205902099609375, 0.22064208984375, 0.22922515869140625, 0.2378082275390625, 0.24639129638671875, 0.254974365234375, 0.26355743408203125, 0.2721405029296875, 0.28072357177734375, 0.289306640625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 3.0, 10.0, 12.0, 15.0, 16.0, 22.0, 19.0, 20.0, 22.0, 25.0, 28.0, 32.0, 29.0, 38.0, 32.0, 39.0, 38.0, 43.0, 40.0, 42.0, 49.0, 29.0, 47.0, 37.0, 41.0, 27.0, 34.0, 35.0, 30.0, 21.0, 18.0, 19.0, 8.0, 10.0, 12.0, 9.0, 11.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.923259735107422, -17.339920043945312, -16.756580352783203, -16.173240661621094, -15.589900970458984, -15.006561279296875, -14.423221588134766, -13.839881896972656, -13.256542205810547, -12.673202514648438, -12.089862823486328, -11.506523132324219, -10.92318344116211, -10.33984375, -9.75650405883789, -9.173164367675781, -8.589823722839355, -8.006484031677246, -7.423144340515137, -6.839804649353027, -6.256464958190918, -5.673125267028809, -5.089785099029541, -4.506445407867432, -3.9231057167053223, -3.339766025543213, -2.7564263343811035, -2.173086404800415, -1.5897467136383057, -1.0064070224761963, -0.4230670928955078, 0.16027259826660156, 0.7436122894287109, 1.3269519805908203, 1.9102917909622192, 2.493631601333618, 3.0769712924957275, 3.660310983657837, 4.243650913238525, 4.826990604400635, 5.410330295562744, 5.9936699867248535, 6.577009677886963, 7.1603498458862305, 7.74368953704834, 8.32702922821045, 8.910368919372559, 9.493708610534668, 10.077048301696777, 10.660387992858887, 11.243727684020996, 11.827067375183105, 12.410407066345215, 12.993746757507324, 13.57708740234375, 14.16042709350586, 14.743766784667969, 15.327106475830078, 15.910446166992188, 16.493785858154297, 17.077125549316406, 17.660465240478516, 18.243804931640625, 18.827144622802734, 19.410484313964844]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 6.0, 5.0, 14.0, 12.0, 19.0, 14.0, 19.0, 23.0, 20.0, 19.0, 28.0, 38.0, 26.0, 32.0, 30.0, 29.0, 53.0, 51.0, 44.0, 43.0, 39.0, 33.0, 34.0, 41.0, 37.0, 35.0, 31.0, 37.0, 32.0, 32.0, 29.0, 10.0, 15.0, 15.0, 9.0, 15.0, 6.0, 7.0, 11.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.86855125427246, -20.16748809814453, -19.466426849365234, -18.765363693237305, -18.064302444458008, -17.363239288330078, -16.66217803955078, -15.961114883422852, -15.260052680969238, -14.558990478515625, -13.857928276062012, -13.156866073608398, -12.455802917480469, -11.754741668701172, -11.053678512573242, -10.352616310119629, -9.651554107666016, -8.950491905212402, -8.249429702758789, -7.548367023468018, -6.847304821014404, -6.146242618560791, -5.4451799392700195, -4.744117736816406, -4.043055534362793, -3.3419933319091797, -2.6409308910369873, -1.939868450164795, -1.2388062477111816, -0.5377440452575684, 0.16331863403320312, 0.8643808364868164, 1.5654449462890625, 2.266507148742676, 2.967569589614868, 3.6686320304870605, 4.369694232940674, 5.070756435394287, 5.771819114685059, 6.472881317138672, 7.173943519592285, 7.875005722045898, 8.576067924499512, 9.277130126953125, 9.978193283081055, 10.679254531860352, 11.380317687988281, 12.081379890441895, 12.782442092895508, 13.483504295349121, 14.184566497802734, 14.885629653930664, 15.586690902709961, 16.28775405883789, 16.988815307617188, 17.689878463745117, 18.390941619873047, 19.092004776000977, 19.793066024780273, 20.494129180908203, 21.1951904296875, 21.89625358581543, 22.59731674194336, 23.298377990722656, 23.999439239501953]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 10.0, 16.0, 19.0, 29.0, 49.0, 95.0, 126.0, 226.0, 434.0, 700.0, 1214.0, 1972.0, 3396.0, 5905.0, 9873.0, 16053.0, 25774.0, 39737.0, 57834.0, 79255.0, 100430.0, 117281.0, 123303.0, 117319.0, 101544.0, 80627.0, 58080.0, 40200.0, 25937.0, 16447.0, 9983.0, 6011.0, 3663.0, 2085.0, 1222.0, 731.0, 389.0, 238.0, 143.0, 80.0, 46.0, 37.0, 23.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.90625, -16.40185546875, -15.8974609375, -15.39306640625, -14.888671875, -14.38427734375, -13.8798828125, -13.37548828125, -12.87109375, -12.36669921875, -11.8623046875, -11.35791015625, -10.853515625, -10.34912109375, -9.8447265625, -9.34033203125, -8.8359375, -8.33154296875, -7.8271484375, -7.32275390625, -6.818359375, -6.31396484375, -5.8095703125, -5.30517578125, -4.80078125, -4.29638671875, -3.7919921875, -3.28759765625, -2.783203125, -2.27880859375, -1.7744140625, -1.27001953125, -0.765625, -0.26123046875, 0.2431640625, 0.74755859375, 1.251953125, 1.75634765625, 2.2607421875, 2.76513671875, 3.26953125, 3.77392578125, 4.2783203125, 4.78271484375, 5.287109375, 5.79150390625, 6.2958984375, 6.80029296875, 7.3046875, 7.80908203125, 8.3134765625, 8.81787109375, 9.322265625, 9.82666015625, 10.3310546875, 10.83544921875, 11.33984375, 11.84423828125, 12.3486328125, 12.85302734375, 13.357421875, 13.86181640625, 14.3662109375, 14.87060546875, 15.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 6.0, 6.0, 14.0, 11.0, 19.0, 14.0, 21.0, 23.0, 23.0, 15.0, 30.0, 36.0, 28.0, 29.0, 32.0, 27.0, 54.0, 53.0, 45.0, 40.0, 41.0, 36.0, 31.0, 42.0, 40.0, 30.0, 34.0, 38.0, 28.0, 36.0, 26.0, 9.0, 13.0, 18.0, 9.0, 14.0, 5.0, 7.0, 12.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.609375, -19.916015625, -19.22265625, -18.529296875, -17.8359375, -17.142578125, -16.44921875, -15.755859375, -15.0625, -14.369140625, -13.67578125, -12.982421875, -12.2890625, -11.595703125, -10.90234375, -10.208984375, -9.515625, -8.822265625, -8.12890625, -7.435546875, -6.7421875, -6.048828125, -5.35546875, -4.662109375, -3.96875, -3.275390625, -2.58203125, -1.888671875, -1.1953125, -0.501953125, 0.19140625, 0.884765625, 1.578125, 2.271484375, 2.96484375, 3.658203125, 4.3515625, 5.044921875, 5.73828125, 6.431640625, 7.125, 7.818359375, 8.51171875, 9.205078125, 9.8984375, 10.591796875, 11.28515625, 11.978515625, 12.671875, 13.365234375, 14.05859375, 14.751953125, 15.4453125, 16.138671875, 16.83203125, 17.525390625, 18.21875, 18.912109375, 19.60546875, 20.298828125, 20.9921875, 21.685546875, 22.37890625, 23.072265625, 23.765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 24.0, 27.0, 38.0, 60.0, 101.0, 166.0, 293.0, 431.0, 730.0, 1155.0, 1790.0, 3060.0, 4604.0, 7235.0, 11312.0, 17103.0, 25168.0, 36787.0, 50290.0, 66685.0, 82447.0, 97054.0, 105956.0, 106267.0, 99000.0, 86963.0, 70293.0, 53601.0, 39332.0, 27639.0, 18644.0, 12295.0, 8106.0, 5133.0, 3287.0, 2113.0, 1273.0, 814.0, 468.0, 327.0, 192.0, 87.0, 69.0, 52.0, 23.0, 31.0, 10.0, 10.0, 7.0, 2.0, 5.0, 2.0], "bins": [-16.96875, -16.4854736328125, -16.002197265625, -15.5189208984375, -15.03564453125, -14.5523681640625, -14.069091796875, -13.5858154296875, -13.1025390625, -12.6192626953125, -12.135986328125, -11.6527099609375, -11.16943359375, -10.6861572265625, -10.202880859375, -9.7196044921875, -9.236328125, -8.7530517578125, -8.269775390625, -7.7864990234375, -7.30322265625, -6.8199462890625, -6.336669921875, -5.8533935546875, -5.3701171875, -4.8868408203125, -4.403564453125, -3.9202880859375, -3.43701171875, -2.9537353515625, -2.470458984375, -1.9871826171875, -1.50390625, -1.0206298828125, -0.537353515625, -0.0540771484375, 0.42919921875, 0.9124755859375, 1.395751953125, 1.8790283203125, 2.3623046875, 2.8455810546875, 3.328857421875, 3.8121337890625, 4.29541015625, 4.7786865234375, 5.261962890625, 5.7452392578125, 6.228515625, 6.7117919921875, 7.195068359375, 7.6783447265625, 8.16162109375, 8.6448974609375, 9.128173828125, 9.6114501953125, 10.0947265625, 10.5780029296875, 11.061279296875, 11.5445556640625, 12.02783203125, 12.5111083984375, 12.994384765625, 13.4776611328125, 13.9609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 3.0, 13.0, 9.0, 16.0, 23.0, 24.0, 16.0, 24.0, 34.0, 27.0, 45.0, 25.0, 28.0, 31.0, 27.0, 33.0, 46.0, 48.0, 53.0, 46.0, 42.0, 29.0, 41.0, 44.0, 39.0, 43.0, 19.0, 27.0, 13.0, 22.0, 18.0, 12.0, 14.0, 13.0, 7.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2734375, -11.8204345703125, -11.367431640625, -10.9144287109375, -10.46142578125, -10.0084228515625, -9.555419921875, -9.1024169921875, -8.6494140625, -8.1964111328125, -7.743408203125, -7.2904052734375, -6.83740234375, -6.3843994140625, -5.931396484375, -5.4783935546875, -5.025390625, -4.5723876953125, -4.119384765625, -3.6663818359375, -3.21337890625, -2.7603759765625, -2.307373046875, -1.8543701171875, -1.4013671875, -0.9483642578125, -0.495361328125, -0.0423583984375, 0.41064453125, 0.8636474609375, 1.316650390625, 1.7696533203125, 2.22265625, 2.6756591796875, 3.128662109375, 3.5816650390625, 4.03466796875, 4.4876708984375, 4.940673828125, 5.3936767578125, 5.8466796875, 6.2996826171875, 6.752685546875, 7.2056884765625, 7.65869140625, 8.1116943359375, 8.564697265625, 9.0177001953125, 9.470703125, 9.9237060546875, 10.376708984375, 10.8297119140625, 11.28271484375, 11.7357177734375, 12.188720703125, 12.6417236328125, 13.0947265625, 13.5477294921875, 14.000732421875, 14.4537353515625, 14.90673828125, 15.3597412109375, 15.812744140625, 16.2657470703125, 16.71875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 10.0, 2.0, 10.0, 17.0, 43.0, 49.0, 96.0, 127.0, 223.0, 289.0, 468.0, 912.0, 1441.0, 2394.0, 4206.0, 7177.0, 12147.0, 20908.0, 34526.0, 54341.0, 79368.0, 108510.0, 131995.0, 139951.0, 130184.0, 106356.0, 78432.0, 52826.0, 32872.0, 20153.0, 11713.0, 6764.0, 4080.0, 2352.0, 1388.0, 848.0, 531.0, 331.0, 183.0, 115.0, 72.0, 43.0, 34.0, 27.0, 14.0, 8.0, 10.0, 7.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.5078125, -7.27655029296875, -7.0452880859375, -6.81402587890625, -6.582763671875, -6.35150146484375, -6.1202392578125, -5.88897705078125, -5.65771484375, -5.42645263671875, -5.1951904296875, -4.96392822265625, -4.732666015625, -4.50140380859375, -4.2701416015625, -4.03887939453125, -3.8076171875, -3.57635498046875, -3.3450927734375, -3.11383056640625, -2.882568359375, -2.65130615234375, -2.4200439453125, -2.18878173828125, -1.95751953125, -1.72625732421875, -1.4949951171875, -1.26373291015625, -1.032470703125, -0.80120849609375, -0.5699462890625, -0.33868408203125, -0.107421875, 0.12384033203125, 0.3551025390625, 0.58636474609375, 0.817626953125, 1.04888916015625, 1.2801513671875, 1.51141357421875, 1.74267578125, 1.97393798828125, 2.2052001953125, 2.43646240234375, 2.667724609375, 2.89898681640625, 3.1302490234375, 3.36151123046875, 3.5927734375, 3.82403564453125, 4.0552978515625, 4.28656005859375, 4.517822265625, 4.74908447265625, 4.9803466796875, 5.21160888671875, 5.44287109375, 5.67413330078125, 5.9053955078125, 6.13665771484375, 6.367919921875, 6.59918212890625, 6.8304443359375, 7.06170654296875, 7.29296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 2.0, 3.0, 6.0, 10.0, 13.0, 21.0, 22.0, 26.0, 37.0, 34.0, 47.0, 58.0, 64.0, 53.0, 63.0, 64.0, 54.0, 63.0, 59.0, 53.0, 59.0, 33.0, 28.0, 15.0, 18.0, 19.0, 10.0, 16.0, 10.0, 13.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00115966796875, -0.0011275634169578552, -0.0010954588651657104, -0.0010633543133735657, -0.001031249761581421, -0.0009991452097892761, -0.0009670406579971313, -0.0009349361062049866, -0.0009028315544128418, -0.000870727002620697, -0.0008386224508285522, -0.0008065178990364075, -0.0007744133472442627, -0.0007423087954521179, -0.0007102042436599731, -0.0006780996918678284, -0.0006459951400756836, -0.0006138905882835388, -0.000581786036491394, -0.0005496814846992493, -0.0005175769329071045, -0.0004854723811149597, -0.00045336782932281494, -0.00042126327753067017, -0.0003891587257385254, -0.0003570541739463806, -0.00032494962215423584, -0.00029284507036209106, -0.0002607405185699463, -0.00022863596677780151, -0.00019653141498565674, -0.00016442686319351196, -0.0001323223114013672, -0.00010021775960922241, -6.811320781707764e-05, -3.600865602493286e-05, -3.904104232788086e-06, 2.820044755935669e-05, 6.0304999351501465e-05, 9.240955114364624e-05, 0.00012451410293579102, 0.0001566186547279358, 0.00018872320652008057, 0.00022082775831222534, 0.0002529323101043701, 0.0002850368618965149, 0.00031714141368865967, 0.00034924596548080444, 0.0003813505172729492, 0.000413455069065094, 0.00044555962085723877, 0.00047766417264938354, 0.0005097687244415283, 0.0005418732762336731, 0.0005739778280258179, 0.0006060823798179626, 0.0006381869316101074, 0.0006702914834022522, 0.000702396035194397, 0.0007345005869865417, 0.0007666051387786865, 0.0007987096905708313, 0.0008308142423629761, 0.0008629187941551208, 0.0008950233459472656]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 13.0, 20.0, 24.0, 42.0, 38.0, 80.0, 107.0, 179.0, 260.0, 416.0, 629.0, 1104.0, 1673.0, 2874.0, 4584.0, 7591.0, 12383.0, 19987.0, 31777.0, 48718.0, 70055.0, 94365.0, 115835.0, 127541.0, 125653.0, 110428.0, 88466.0, 64429.0, 44144.0, 28890.0, 17780.0, 11131.0, 6778.0, 4049.0, 2449.0, 1516.0, 923.0, 608.0, 342.0, 219.0, 167.0, 87.0, 67.0, 39.0, 27.0, 21.0, 15.0, 10.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.1328125, -6.9090576171875, -6.685302734375, -6.4615478515625, -6.23779296875, -6.0140380859375, -5.790283203125, -5.5665283203125, -5.3427734375, -5.1190185546875, -4.895263671875, -4.6715087890625, -4.44775390625, -4.2239990234375, -4.000244140625, -3.7764892578125, -3.552734375, -3.3289794921875, -3.105224609375, -2.8814697265625, -2.65771484375, -2.4339599609375, -2.210205078125, -1.9864501953125, -1.7626953125, -1.5389404296875, -1.315185546875, -1.0914306640625, -0.86767578125, -0.6439208984375, -0.420166015625, -0.1964111328125, 0.02734375, 0.2510986328125, 0.474853515625, 0.6986083984375, 0.92236328125, 1.1461181640625, 1.369873046875, 1.5936279296875, 1.8173828125, 2.0411376953125, 2.264892578125, 2.4886474609375, 2.71240234375, 2.9361572265625, 3.159912109375, 3.3836669921875, 3.607421875, 3.8311767578125, 4.054931640625, 4.2786865234375, 4.50244140625, 4.7261962890625, 4.949951171875, 5.1737060546875, 5.3974609375, 5.6212158203125, 5.844970703125, 6.0687255859375, 6.29248046875, 6.5162353515625, 6.739990234375, 6.9637451171875, 7.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 6.0, 7.0, 5.0, 9.0, 7.0, 14.0, 13.0, 16.0, 20.0, 18.0, 32.0, 37.0, 33.0, 42.0, 43.0, 50.0, 57.0, 54.0, 37.0, 52.0, 51.0, 43.0, 43.0, 40.0, 33.0, 37.0, 40.0, 23.0, 23.0, 18.0, 21.0, 12.0, 19.0, 11.0, 7.0, 7.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.849609375, -2.754730224609375, -2.65985107421875, -2.564971923828125, -2.4700927734375, -2.375213623046875, -2.28033447265625, -2.185455322265625, -2.090576171875, -1.995697021484375, -1.90081787109375, -1.805938720703125, -1.7110595703125, -1.616180419921875, -1.52130126953125, -1.426422119140625, -1.33154296875, -1.236663818359375, -1.14178466796875, -1.046905517578125, -0.9520263671875, -0.857147216796875, -0.76226806640625, -0.667388916015625, -0.572509765625, -0.477630615234375, -0.38275146484375, -0.287872314453125, -0.1929931640625, -0.098114013671875, -0.00323486328125, 0.091644287109375, 0.1865234375, 0.281402587890625, 0.37628173828125, 0.471160888671875, 0.5660400390625, 0.660919189453125, 0.75579833984375, 0.850677490234375, 0.945556640625, 1.040435791015625, 1.13531494140625, 1.230194091796875, 1.3250732421875, 1.419952392578125, 1.51483154296875, 1.609710693359375, 1.70458984375, 1.799468994140625, 1.89434814453125, 1.989227294921875, 2.0841064453125, 2.178985595703125, 2.27386474609375, 2.368743896484375, 2.463623046875, 2.558502197265625, 2.65338134765625, 2.748260498046875, 2.8431396484375, 2.938018798828125, 3.03289794921875, 3.127777099609375, 3.22265625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 3.0, 1.0, 14.0, 10.0, 14.0, 5.0, 23.0, 20.0, 10.0, 16.0, 32.0, 24.0, 28.0, 20.0, 40.0, 23.0, 32.0, 44.0, 32.0, 48.0, 30.0, 27.0, 39.0, 45.0, 37.0, 39.0, 33.0, 36.0, 29.0, 34.0, 36.0, 28.0, 33.0, 16.0, 11.0, 16.0, 12.0, 7.0, 11.0, 5.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.452930450439453, -15.895241737365723, -15.337553024291992, -14.779863357543945, -14.222174644470215, -13.664485931396484, -13.106797218322754, -12.549108505249023, -11.991418838500977, -11.433730125427246, -10.876041412353516, -10.318351745605469, -9.760663032531738, -9.202974319458008, -8.645285606384277, -8.087596893310547, -7.529908180236816, -6.972219467163086, -6.414530277252197, -5.856841564178467, -5.299152374267578, -4.741463661193848, -4.183774948120117, -3.6260859966278076, -3.068397045135498, -2.5107080936431885, -1.9530192613601685, -1.3953304290771484, -0.8376414775848389, -0.2799525260925293, 0.27773618698120117, 0.8354251384735107, 1.3931140899658203, 1.9508030414581299, 2.5084919929504395, 3.06618070602417, 3.6238696575164795, 4.181558609008789, 4.7392473220825195, 5.29693603515625, 5.854625225067139, 6.412313938140869, 6.970003128051758, 7.527691841125488, 8.085380554199219, 8.643070220947266, 9.20075798034668, 9.758447647094727, 10.316136360168457, 10.873825073242188, 11.431513786315918, 11.989202499389648, 12.546892166137695, 13.104580879211426, 13.662269592285156, 14.219958305358887, 14.777647018432617, 15.335335731506348, 15.893024444580078, 16.450714111328125, 17.00840187072754, 17.566091537475586, 18.123779296875, 18.681468963623047, 19.239158630371094]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 9.0, 8.0, 7.0, 11.0, 16.0, 14.0, 12.0, 20.0, 26.0, 21.0, 30.0, 28.0, 32.0, 30.0, 34.0, 30.0, 42.0, 41.0, 35.0, 31.0, 38.0, 32.0, 43.0, 35.0, 35.0, 35.0, 37.0, 37.0, 31.0, 33.0, 27.0, 17.0, 20.0, 13.0, 20.0, 13.0, 16.0, 11.0, 7.0, 4.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-22.683317184448242, -21.936798095703125, -21.190277099609375, -20.443758010864258, -19.697237014770508, -18.95071792602539, -18.20419692993164, -17.457677841186523, -16.711158752441406, -15.964638710021973, -15.218118667602539, -14.471599578857422, -13.725079536437988, -12.978559494018555, -12.232039451599121, -11.485519409179688, -10.738999366760254, -9.99247932434082, -9.245959281921387, -8.499439239501953, -7.752920150756836, -7.006400108337402, -6.259880065917969, -5.513360500335693, -4.76684045791626, -4.020320415496826, -3.273800849914551, -2.527280807495117, -1.7807610034942627, -1.0342411994934082, -0.2877211570739746, 0.4587984085083008, 1.2053184509277344, 1.9518382549285889, 2.6983580589294434, 3.444878101348877, 4.191397666931152, 4.937917709350586, 5.6844377517700195, 6.430957317352295, 7.1774773597717285, 7.923997402191162, 8.670516967773438, 9.417037010192871, 10.163557052612305, 10.910076141357422, 11.656597137451172, 12.403116226196289, 13.149636268615723, 13.896156311035156, 14.64267635345459, 15.389196395874023, 16.13571548461914, 16.88223648071289, 17.628755569458008, 18.375274658203125, 19.121795654296875, 19.868314743041992, 20.614835739135742, 21.36135482788086, 22.10787582397461, 22.854394912719727, 23.600914001464844, 24.347434997558594, 25.09395408630371]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 3.0, 11.0, 13.0, 11.0, 13.0, 27.0, 31.0, 39.0, 57.0, 74.0, 92.0, 142.0, 225.0, 260.0, 435.0, 660.0, 1042.0, 1433.0, 2065.0, 2873.0, 3630.0, 1025480.0, 3391.0, 2465.0, 1929.0, 1324.0, 886.0, 619.0, 411.0, 272.0, 164.0, 123.0, 82.0, 77.0, 56.0, 42.0, 25.0, 26.0, 21.0, 20.0, 8.0, 12.0, 10.0, 8.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-258.6935119628906, -250.44822692871094, -242.2029266357422, -233.9576416015625, -225.7123565673828, -217.46707153320312, -209.22177124023438, -200.9764862060547, -192.731201171875, -184.4859161376953, -176.24061584472656, -167.99533081054688, -159.7500457763672, -151.5047607421875, -143.25946044921875, -135.01417541503906, -126.76887512207031, -118.5235824584961, -110.2782974243164, -102.03300476074219, -93.7877197265625, -85.54242706298828, -77.29713439941406, -69.05184936523438, -60.806556701660156, -52.5612678527832, -44.31597900390625, -36.07068634033203, -27.825397491455078, -19.580108642578125, -11.334815979003906, -3.089527130126953, 5.15576171875, 13.40105152130127, 21.64634132385254, 29.891632080078125, 38.13692092895508, 46.38220977783203, 54.62750244140625, 62.8727912902832, 71.11808013916016, 79.36337280273438, 87.60865783691406, 95.85395050048828, 104.0992431640625, 112.34452819824219, 120.5898208618164, 128.83511352539062, 137.0803985595703, 145.32568359375, 153.57098388671875, 161.81626892089844, 170.06155395507812, 178.30685424804688, 186.55213928222656, 194.79742431640625, 203.042724609375, 211.2880096435547, 219.53330993652344, 227.77859497070312, 236.0238800048828, 244.2691650390625, 252.51446533203125, 260.759765625, 269.0050354003906]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 11.0, 6.0, 9.0, 16.0, 14.0, 19.0, 31.0, 34.0, 30.0, 44.0, 76.0, 76.0, 106.0, 112.0, 167.0, 221.0, 247.0, 338.0, 485.0, 725.0, 1048.0, 1631.0, 2549.0, 4371.0, 8141.0, 18064.0, 51362288.0, 42859.0, 11473.0, 5912.0, 3471.0, 2130.0, 1288.0, 879.0, 601.0, 401.0, 335.0, 253.0, 181.0, 161.0, 114.0, 99.0, 65.0, 61.0, 45.0, 39.0, 25.0, 20.0, 16.0, 13.0, 10.0, 9.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 4.0], "bins": [-255.2211151123047, -247.1879425048828, -239.15478515625, -231.12161254882812, -223.08843994140625, -215.05526733398438, -207.02210998535156, -198.9889373779297, -190.95578002929688, -182.922607421875, -174.8894500732422, -166.8562774658203, -158.82310485839844, -150.78994750976562, -142.75677490234375, -134.72360229492188, -126.6904296875, -118.65726470947266, -110.62409210205078, -102.59092712402344, -94.55775451660156, -86.52458953857422, -78.49142456054688, -70.458251953125, -62.425086975097656, -54.39191818237305, -46.35874938964844, -38.325584411621094, -30.292415618896484, -22.259246826171875, -14.226081848144531, -6.192913055419922, 1.840240478515625, 9.873408317565918, 17.90657615661621, 25.939743041992188, 33.9729118347168, 42.006080627441406, 50.03924560546875, 58.07241439819336, 66.10558319091797, 74.13874816894531, 82.17192077636719, 90.20508575439453, 98.23825073242188, 106.27142333984375, 114.3045883178711, 122.33775329589844, 130.3709259033203, 138.4040985107422, 146.437255859375, 154.47042846679688, 162.50360107421875, 170.53677368164062, 178.56993103027344, 186.6031036376953, 194.63626098632812, 202.66943359375, 210.7025909423828, 218.7357635498047, 226.76893615722656, 234.80209350585938, 242.83526611328125, 250.86843872070312, 258.901611328125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 7.0, 13.0, 10.0, 13.0, 25.0, 30.0, 42.0, 39.0, 57.0, 70.0, 81.0, 96.0, 75.0, 90.0, 74.0, 67.0, 51.0, 32.0, 39.0, 22.0, 15.0, 12.0, 11.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.27764892578125, -109.9367904663086, -103.59593200683594, -97.25507354736328, -90.91421508789062, -84.57335662841797, -78.23249816894531, -71.89164733886719, -65.55078125, -59.209922790527344, -52.86906433105469, -46.52820587158203, -40.187347412109375, -33.84648895263672, -27.505634307861328, -21.164775848388672, -14.823921203613281, -8.483062744140625, -2.142205238342285, 4.198652267456055, 10.539510726928711, 16.880369186401367, 23.22122573852539, 29.562084197998047, 35.9029426574707, 42.24380111694336, 48.584659576416016, 54.925514221191406, 61.26637268066406, 67.60723114013672, 73.94808959960938, 80.28894805908203, 86.62980651855469, 92.97066497802734, 99.3115234375, 105.65238189697266, 111.99324035644531, 118.33409881591797, 124.67495727539062, 131.01580810546875, 137.35667419433594, 143.69752502441406, 150.03839111328125, 156.37924194335938, 162.72010803222656, 169.0609588623047, 175.40182495117188, 181.74267578125, 188.08352661132812, 194.42437744140625, 200.76524353027344, 207.10609436035156, 213.44696044921875, 219.78781127929688, 226.12867736816406, 232.4695281982422, 238.81039428710938, 245.1512451171875, 251.4921112060547, 257.8329772949219, 264.173828125, 270.5146789550781, 276.85552978515625, 283.1964111328125, 289.5372619628906]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 7.0, 18.0, 13.0, 15.0, 23.0, 33.0, 24.0, 27.0, 35.0, 43.0, 66.0, 56.0, 74.0, 86.0, 69.0, 66.0, 66.0, 41.0, 36.0, 28.0, 26.0, 26.0, 23.0, 21.0, 16.0, 16.0, 8.0, 7.0, 5.0, 6.0, 1.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-242.6728515625, -235.62342834472656, -228.57400512695312, -221.5245819091797, -214.47515869140625, -207.4257354736328, -200.37631225585938, -193.326904296875, -186.2774658203125, -179.22804260253906, -172.17861938476562, -165.1291961669922, -158.07977294921875, -151.0303497314453, -143.98092651367188, -136.9315185546875, -129.88209533691406, -122.83267211914062, -115.78324890136719, -108.73382568359375, -101.68440246582031, -94.63497924804688, -87.58556365966797, -80.53614044189453, -73.4867172241211, -66.43729400634766, -59.38787078857422, -52.33845138549805, -45.28902816772461, -38.23960494995117, -31.190185546875, -24.140762329101562, -17.091354370117188, -10.041932106018066, -2.9925098419189453, 4.056911468505859, 11.106334686279297, 18.155757904052734, 25.205177307128906, 32.254600524902344, 39.30402374267578, 46.35344696044922, 53.402870178222656, 60.45228958129883, 67.501708984375, 74.55113220214844, 81.60055541992188, 88.64997863769531, 95.69940185546875, 102.74882507324219, 109.79824829101562, 116.84767150878906, 123.8970947265625, 130.94651794433594, 137.99594116210938, 145.04534912109375, 152.09478759765625, 159.1442108154297, 166.19363403320312, 173.24305725097656, 180.29248046875, 187.34190368652344, 194.39132690429688, 201.44073486328125, 208.4901580810547]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 9.0, 14.0, 14.0, 20.0, 29.0, 61.0, 92.0, 140.0, 237.0, 357.0, 641.0, 1060.0, 2000.0, 3972.0, 8654.0, 21970.0, 76550.0, 542762.0, 3292057.0, 184971.0, 36598.0, 12070.0, 4868.0, 2250.0, 1203.0, 662.0, 375.0, 237.0, 135.0, 81.0, 76.0, 38.0, 27.0, 16.0, 12.0, 5.0, 9.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.7265625, -10.4306640625, -10.134765625, -9.8388671875, -9.54296875, -9.2470703125, -8.951171875, -8.6552734375, -8.359375, -8.0634765625, -7.767578125, -7.4716796875, -7.17578125, -6.8798828125, -6.583984375, -6.2880859375, -5.9921875, -5.6962890625, -5.400390625, -5.1044921875, -4.80859375, -4.5126953125, -4.216796875, -3.9208984375, -3.625, -3.3291015625, -3.033203125, -2.7373046875, -2.44140625, -2.1455078125, -1.849609375, -1.5537109375, -1.2578125, -0.9619140625, -0.666015625, -0.3701171875, -0.07421875, 0.2216796875, 0.517578125, 0.8134765625, 1.109375, 1.4052734375, 1.701171875, 1.9970703125, 2.29296875, 2.5888671875, 2.884765625, 3.1806640625, 3.4765625, 3.7724609375, 4.068359375, 4.3642578125, 4.66015625, 4.9560546875, 5.251953125, 5.5478515625, 5.84375, 6.1396484375, 6.435546875, 6.7314453125, 7.02734375, 7.3232421875, 7.619140625, 7.9150390625, 8.2109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 8.0, 10.0, 11.0, 29.0, 35.0, 51.0, 70.0, 81.0, 118.0, 130.0, 109.0, 93.0, 87.0, 54.0, 24.0, 19.0, 16.0, 13.0, 10.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.669921875, -0.6478500366210938, -0.6257781982421875, -0.6037063598632812, -0.581634521484375, -0.5595626831054688, -0.5374908447265625, -0.5154190063476562, -0.49334716796875, -0.47127532958984375, -0.4492034912109375, -0.42713165283203125, -0.405059814453125, -0.38298797607421875, -0.3609161376953125, -0.33884429931640625, -0.3167724609375, -0.29470062255859375, -0.2726287841796875, -0.25055694580078125, -0.228485107421875, -0.20641326904296875, -0.1843414306640625, -0.16226959228515625, -0.14019775390625, -0.11812591552734375, -0.0960540771484375, -0.07398223876953125, -0.051910400390625, -0.02983856201171875, -0.0077667236328125, 0.01430511474609375, 0.036376953125, 0.05844879150390625, 0.0805206298828125, 0.10259246826171875, 0.124664306640625, 0.14673614501953125, 0.1688079833984375, 0.19087982177734375, 0.21295166015625, 0.23502349853515625, 0.2570953369140625, 0.27916717529296875, 0.301239013671875, 0.32331085205078125, 0.3453826904296875, 0.36745452880859375, 0.3895263671875, 0.41159820556640625, 0.4336700439453125, 0.45574188232421875, 0.477813720703125, 0.49988555908203125, 0.5219573974609375, 0.5440292358398438, 0.56610107421875, 0.5881729125976562, 0.6102447509765625, 0.6323165893554688, 0.654388427734375, 0.6764602661132812, 0.6985321044921875, 0.7206039428710938, 0.74267578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 16.0, 13.0, 27.0, 25.0, 43.0, 69.0, 91.0, 128.0, 177.0, 295.0, 523.0, 816.0, 1431.0, 2564.0, 4426.0, 8846.0, 18549.0, 41679.0, 106765.0, 336810.0, 2249787.0, 1037100.0, 238927.0, 80710.0, 32861.0, 15003.0, 7337.0, 3859.0, 2104.0, 1203.0, 763.0, 460.0, 277.0, 176.0, 107.0, 82.0, 61.0, 46.0, 26.0, 22.0, 21.0, 11.0, 12.0, 8.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.73046875, -4.57720947265625, -4.4239501953125, -4.27069091796875, -4.117431640625, -3.96417236328125, -3.8109130859375, -3.65765380859375, -3.50439453125, -3.35113525390625, -3.1978759765625, -3.04461669921875, -2.891357421875, -2.73809814453125, -2.5848388671875, -2.43157958984375, -2.2783203125, -2.12506103515625, -1.9718017578125, -1.81854248046875, -1.665283203125, -1.51202392578125, -1.3587646484375, -1.20550537109375, -1.05224609375, -0.89898681640625, -0.7457275390625, -0.59246826171875, -0.439208984375, -0.28594970703125, -0.1326904296875, 0.02056884765625, 0.173828125, 0.32708740234375, 0.4803466796875, 0.63360595703125, 0.786865234375, 0.94012451171875, 1.0933837890625, 1.24664306640625, 1.39990234375, 1.55316162109375, 1.7064208984375, 1.85968017578125, 2.012939453125, 2.16619873046875, 2.3194580078125, 2.47271728515625, 2.6259765625, 2.77923583984375, 2.9324951171875, 3.08575439453125, 3.239013671875, 3.39227294921875, 3.5455322265625, 3.69879150390625, 3.85205078125, 4.00531005859375, 4.1585693359375, 4.31182861328125, 4.465087890625, 4.61834716796875, 4.7716064453125, 4.92486572265625, 5.078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 9.0, 7.0, 8.0, 15.0, 17.0, 17.0, 21.0, 27.0, 35.0, 50.0, 47.0, 90.0, 93.0, 121.0, 157.0, 196.0, 245.0, 434.0, 966.0, 382.0, 278.0, 182.0, 146.0, 126.0, 89.0, 73.0, 47.0, 32.0, 34.0, 19.0, 21.0, 14.0, 14.0, 4.0, 9.0, 15.0, 7.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3349609375, -1.28961181640625, -1.2442626953125, -1.19891357421875, -1.153564453125, -1.10821533203125, -1.0628662109375, -1.01751708984375, -0.97216796875, -0.92681884765625, -0.8814697265625, -0.83612060546875, -0.790771484375, -0.74542236328125, -0.7000732421875, -0.65472412109375, -0.609375, -0.56402587890625, -0.5186767578125, -0.47332763671875, -0.427978515625, -0.38262939453125, -0.3372802734375, -0.29193115234375, -0.24658203125, -0.20123291015625, -0.1558837890625, -0.11053466796875, -0.065185546875, -0.01983642578125, 0.0255126953125, 0.07086181640625, 0.1162109375, 0.16156005859375, 0.2069091796875, 0.25225830078125, 0.297607421875, 0.34295654296875, 0.3883056640625, 0.43365478515625, 0.47900390625, 0.52435302734375, 0.5697021484375, 0.61505126953125, 0.660400390625, 0.70574951171875, 0.7510986328125, 0.79644775390625, 0.841796875, 0.88714599609375, 0.9324951171875, 0.97784423828125, 1.023193359375, 1.06854248046875, 1.1138916015625, 1.15924072265625, 1.20458984375, 1.24993896484375, 1.2952880859375, 1.34063720703125, 1.385986328125, 1.43133544921875, 1.4766845703125, 1.52203369140625, 1.5673828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 8.0, 13.0, 12.0, 25.0, 23.0, 20.0, 21.0, 33.0, 36.0, 46.0, 57.0, 59.0, 60.0, 61.0, 53.0, 59.0, 57.0, 58.0, 42.0, 51.0, 39.0, 27.0, 24.0, 19.0, 19.0, 8.0, 19.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.321364402770996, -6.098531723022461, -5.875699520111084, -5.652866840362549, -5.430034637451172, -5.207201957702637, -4.984369277954102, -4.761537075042725, -4.538704872131348, -4.3158721923828125, -4.0930399894714355, -3.8702073097229004, -3.6473751068115234, -3.4245424270629883, -3.2017099857330322, -2.978877544403076, -2.756044864654541, -2.533212423324585, -2.310379981994629, -2.0875473022460938, -1.8647149801254272, -1.6418825387954712, -1.4190499782562256, -1.1962175369262695, -0.9733850955963135, -0.7505526542663574, -0.5277201533317566, -0.30488765239715576, -0.08205521106719971, 0.14077723026275635, 0.36360979080200195, 0.586442232131958, 0.8092751502990723, 1.0321075916290283, 1.2549400329589844, 1.47777259349823, 1.700605034828186, 1.923437476158142, 2.1462700366973877, 2.3691024780273438, 2.5919349193573, 2.814767360687256, 3.037599802017212, 3.260432243347168, 3.483264923095703, 3.70609712600708, 3.9289298057556152, 4.151762008666992, 4.374594688415527, 4.5974273681640625, 4.8202595710754395, 5.043092250823975, 5.265924453735352, 5.488757133483887, 5.711589813232422, 5.934422016143799, 6.157254219055176, 6.380086898803711, 6.602919101715088, 6.825751781463623, 7.048583984375, 7.271416664123535, 7.49424934387207, 7.717081546783447, 7.939914226531982]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 7.0, 2.0, 7.0, 7.0, 9.0, 14.0, 15.0, 13.0, 25.0, 15.0, 19.0, 32.0, 28.0, 26.0, 37.0, 41.0, 47.0, 48.0, 48.0, 48.0, 51.0, 53.0, 49.0, 45.0, 36.0, 34.0, 30.0, 38.0, 29.0, 23.0, 24.0, 15.0, 12.0, 16.0, 12.0, 12.0, 3.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.141359329223633, -6.920445442199707, -6.699531555175781, -6.4786176681518555, -6.25770378112793, -6.036789894104004, -5.81587553024292, -5.594961643218994, -5.374047756195068, -5.153133869171143, -4.932219982147217, -4.711306095123291, -4.490391731262207, -4.269477844238281, -4.0485639572143555, -3.8276500701904297, -3.606736183166504, -3.385822296142578, -3.1649084091186523, -2.9439942836761475, -2.7230803966522217, -2.502166509628296, -2.281252384185791, -2.0603384971618652, -1.8394246101379395, -1.6185107231140137, -1.3975967168807983, -1.176682710647583, -0.9557688236236572, -0.7348549365997314, -0.5139409303665161, -0.2930269241333008, -0.072113037109375, 0.14880090951919556, 0.3697148561477661, 0.5906288027763367, 0.8115427494049072, 1.032456636428833, 1.2533706426620483, 1.4742846488952637, 1.6951985359191895, 1.9161124229431152, 2.137026309967041, 2.357940435409546, 2.5788543224334717, 2.7997682094573975, 3.0206823348999023, 3.241596221923828, 3.462510108947754, 3.6834239959716797, 3.9043378829956055, 4.125251770019531, 4.346165657043457, 4.567079544067383, 4.787993907928467, 5.008907794952393, 5.229821681976318, 5.450735569000244, 5.67164945602417, 5.892563343048096, 6.11347770690918, 6.3343915939331055, 6.555305480957031, 6.776219367980957, 6.997133255004883]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 5.0, 11.0, 13.0, 15.0, 31.0, 36.0, 54.0, 92.0, 141.0, 176.0, 295.0, 513.0, 885.0, 1598.0, 3057.0, 6733.0, 17393.0, 57782.0, 268119.0, 514631.0, 124566.0, 31743.0, 10825.0, 4618.0, 2213.0, 1207.0, 652.0, 365.0, 257.0, 170.0, 109.0, 74.0, 44.0, 29.0, 24.0, 18.0, 13.0, 9.0, 6.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.9765625, -8.689453125, -8.40234375, -8.115234375, -7.828125, -7.541015625, -7.25390625, -6.966796875, -6.6796875, -6.392578125, -6.10546875, -5.818359375, -5.53125, -5.244140625, -4.95703125, -4.669921875, -4.3828125, -4.095703125, -3.80859375, -3.521484375, -3.234375, -2.947265625, -2.66015625, -2.373046875, -2.0859375, -1.798828125, -1.51171875, -1.224609375, -0.9375, -0.650390625, -0.36328125, -0.076171875, 0.2109375, 0.498046875, 0.78515625, 1.072265625, 1.359375, 1.646484375, 1.93359375, 2.220703125, 2.5078125, 2.794921875, 3.08203125, 3.369140625, 3.65625, 3.943359375, 4.23046875, 4.517578125, 4.8046875, 5.091796875, 5.37890625, 5.666015625, 5.953125, 6.240234375, 6.52734375, 6.814453125, 7.1015625, 7.388671875, 7.67578125, 7.962890625, 8.25, 8.537109375, 8.82421875, 9.111328125, 9.3984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 2.0, 4.0, 9.0, 13.0, 16.0, 22.0, 22.0, 58.0, 44.0, 58.0, 66.0, 94.0, 98.0, 99.0, 101.0, 78.0, 54.0, 36.0, 33.0, 28.0, 20.0, 16.0, 8.0, 5.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6953125, -0.6726303100585938, -0.6499481201171875, -0.6272659301757812, -0.604583740234375, -0.5819015502929688, -0.5592193603515625, -0.5365371704101562, -0.51385498046875, -0.49117279052734375, -0.4684906005859375, -0.44580841064453125, -0.423126220703125, -0.40044403076171875, -0.3777618408203125, -0.35507965087890625, -0.3323974609375, -0.30971527099609375, -0.2870330810546875, -0.26435089111328125, -0.241668701171875, -0.21898651123046875, -0.1963043212890625, -0.17362213134765625, -0.15093994140625, -0.12825775146484375, -0.1055755615234375, -0.08289337158203125, -0.060211181640625, -0.03752899169921875, -0.0148468017578125, 0.00783538818359375, 0.030517578125, 0.05319976806640625, 0.0758819580078125, 0.09856414794921875, 0.121246337890625, 0.14392852783203125, 0.1666107177734375, 0.18929290771484375, 0.21197509765625, 0.23465728759765625, 0.2573394775390625, 0.28002166748046875, 0.302703857421875, 0.32538604736328125, 0.3480682373046875, 0.37075042724609375, 0.3934326171875, 0.41611480712890625, 0.4387969970703125, 0.46147918701171875, 0.484161376953125, 0.5068435668945312, 0.5295257568359375, 0.5522079467773438, 0.57489013671875, 0.5975723266601562, 0.6202545166015625, 0.6429367065429688, 0.665618896484375, 0.6883010864257812, 0.7109832763671875, 0.7336654663085938, 0.75634765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 11.0, 11.0, 13.0, 26.0, 20.0, 37.0, 61.0, 85.0, 120.0, 190.0, 293.0, 447.0, 815.0, 1401.0, 2399.0, 4462.0, 8661.0, 19865.0, 67595.0, 417823.0, 417746.0, 67624.0, 19704.0, 8771.0, 4363.0, 2470.0, 1335.0, 852.0, 470.0, 316.0, 190.0, 131.0, 74.0, 51.0, 41.0, 15.0, 15.0, 13.0, 16.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.515625, -8.24951171875, -7.9833984375, -7.71728515625, -7.451171875, -7.18505859375, -6.9189453125, -6.65283203125, -6.38671875, -6.12060546875, -5.8544921875, -5.58837890625, -5.322265625, -5.05615234375, -4.7900390625, -4.52392578125, -4.2578125, -3.99169921875, -3.7255859375, -3.45947265625, -3.193359375, -2.92724609375, -2.6611328125, -2.39501953125, -2.12890625, -1.86279296875, -1.5966796875, -1.33056640625, -1.064453125, -0.79833984375, -0.5322265625, -0.26611328125, 0.0, 0.26611328125, 0.5322265625, 0.79833984375, 1.064453125, 1.33056640625, 1.5966796875, 1.86279296875, 2.12890625, 2.39501953125, 2.6611328125, 2.92724609375, 3.193359375, 3.45947265625, 3.7255859375, 3.99169921875, 4.2578125, 4.52392578125, 4.7900390625, 5.05615234375, 5.322265625, 5.58837890625, 5.8544921875, 6.12060546875, 6.38671875, 6.65283203125, 6.9189453125, 7.18505859375, 7.451171875, 7.71728515625, 7.9833984375, 8.24951171875, 8.515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 10.0, 6.0, 12.0, 7.0, 6.0, 17.0, 16.0, 21.0, 23.0, 17.0, 27.0, 28.0, 36.0, 38.0, 33.0, 43.0, 37.0, 45.0, 35.0, 38.0, 53.0, 42.0, 40.0, 49.0, 33.0, 31.0, 40.0, 33.0, 26.0, 25.0, 25.0, 14.0, 17.0, 23.0, 12.0, 13.0, 12.0, 1.0, 8.0, 2.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.376800537109375, -3.26141357421875, -3.146026611328125, -3.0306396484375, -2.915252685546875, -2.79986572265625, -2.684478759765625, -2.569091796875, -2.453704833984375, -2.33831787109375, -2.222930908203125, -2.1075439453125, -1.992156982421875, -1.87677001953125, -1.761383056640625, -1.64599609375, -1.530609130859375, -1.41522216796875, -1.299835205078125, -1.1844482421875, -1.069061279296875, -0.95367431640625, -0.838287353515625, -0.722900390625, -0.607513427734375, -0.49212646484375, -0.376739501953125, -0.2613525390625, -0.145965576171875, -0.03057861328125, 0.084808349609375, 0.2001953125, 0.315582275390625, 0.43096923828125, 0.546356201171875, 0.6617431640625, 0.777130126953125, 0.89251708984375, 1.007904052734375, 1.123291015625, 1.238677978515625, 1.35406494140625, 1.469451904296875, 1.5848388671875, 1.700225830078125, 1.81561279296875, 1.930999755859375, 2.04638671875, 2.161773681640625, 2.27716064453125, 2.392547607421875, 2.5079345703125, 2.623321533203125, 2.73870849609375, 2.854095458984375, 2.969482421875, 3.084869384765625, 3.20025634765625, 3.315643310546875, 3.4310302734375, 3.546417236328125, 3.66180419921875, 3.777191162109375, 3.892578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 6.0, 8.0, 4.0, 10.0, 8.0, 13.0, 19.0, 34.0, 47.0, 60.0, 94.0, 122.0, 197.0, 301.0, 445.0, 742.0, 1204.0, 2062.0, 3860.0, 7645.0, 17715.0, 49692.0, 225096.0, 548921.0, 128798.0, 34309.0, 13243.0, 6157.0, 3134.0, 1682.0, 1013.0, 629.0, 418.0, 266.0, 183.0, 133.0, 90.0, 69.0, 44.0, 29.0, 15.0, 15.0, 5.0, 6.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.99609375, -5.8106689453125, -5.625244140625, -5.4398193359375, -5.25439453125, -5.0689697265625, -4.883544921875, -4.6981201171875, -4.5126953125, -4.3272705078125, -4.141845703125, -3.9564208984375, -3.77099609375, -3.5855712890625, -3.400146484375, -3.2147216796875, -3.029296875, -2.8438720703125, -2.658447265625, -2.4730224609375, -2.28759765625, -2.1021728515625, -1.916748046875, -1.7313232421875, -1.5458984375, -1.3604736328125, -1.175048828125, -0.9896240234375, -0.80419921875, -0.6187744140625, -0.433349609375, -0.2479248046875, -0.0625, 0.1229248046875, 0.308349609375, 0.4937744140625, 0.67919921875, 0.8646240234375, 1.050048828125, 1.2354736328125, 1.4208984375, 1.6063232421875, 1.791748046875, 1.9771728515625, 2.16259765625, 2.3480224609375, 2.533447265625, 2.7188720703125, 2.904296875, 3.0897216796875, 3.275146484375, 3.4605712890625, 3.64599609375, 3.8314208984375, 4.016845703125, 4.2022705078125, 4.3876953125, 4.5731201171875, 4.758544921875, 4.9439697265625, 5.12939453125, 5.3148193359375, 5.500244140625, 5.6856689453125, 5.87109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 6.0, 12.0, 12.0, 19.0, 27.0, 29.0, 57.0, 72.0, 133.0, 155.0, 147.0, 105.0, 60.0, 46.0, 27.0, 21.0, 14.0, 9.0, 6.0, 10.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010309219360351562, -0.0009960383176803589, -0.0009611546993255615, -0.0009262710809707642, -0.0008913874626159668, -0.0008565038442611694, -0.0008216202259063721, -0.0007867366075515747, -0.0007518529891967773, -0.00071696937084198, -0.0006820857524871826, -0.0006472021341323853, -0.0006123185157775879, -0.0005774348974227905, -0.0005425512790679932, -0.0005076676607131958, -0.00047278404235839844, -0.0004379004240036011, -0.0004030168056488037, -0.00036813318729400635, -0.000333249568939209, -0.0002983659505844116, -0.00026348233222961426, -0.0002285987138748169, -0.00019371509552001953, -0.00015883147716522217, -0.0001239478588104248, -8.906424045562744e-05, -5.418062210083008e-05, -1.9297003746032715e-05, 1.558661460876465e-05, 5.047023296356201e-05, 8.535385131835938e-05, 0.00012023746967315674, 0.0001551210880279541, 0.00019000470638275146, 0.00022488832473754883, 0.0002597719430923462, 0.00029465556144714355, 0.0003295391798019409, 0.0003644227981567383, 0.00039930641651153564, 0.000434190034866333, 0.00046907365322113037, 0.0005039572715759277, 0.0005388408899307251, 0.0005737245082855225, 0.0006086081266403198, 0.0006434917449951172, 0.0006783753633499146, 0.0007132589817047119, 0.0007481426000595093, 0.0007830262184143066, 0.000817909836769104, 0.0008527934551239014, 0.0008876770734786987, 0.0009225606918334961, 0.0009574443101882935, 0.0009923279285430908, 0.0010272115468978882, 0.0010620951652526855, 0.001096978783607483, 0.0011318624019622803, 0.0011667460203170776, 0.001201629638671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 7.0, 15.0, 26.0, 30.0, 33.0, 51.0, 84.0, 107.0, 164.0, 237.0, 348.0, 549.0, 803.0, 1348.0, 2226.0, 3938.0, 6998.0, 14465.0, 36453.0, 144708.0, 544082.0, 208674.0, 46821.0, 17113.0, 8262.0, 4181.0, 2570.0, 1506.0, 922.0, 583.0, 376.0, 245.0, 183.0, 117.0, 99.0, 56.0, 42.0, 33.0, 24.0, 18.0, 17.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.974609375, -3.840362548828125, -3.70611572265625, -3.571868896484375, -3.4376220703125, -3.303375244140625, -3.16912841796875, -3.034881591796875, -2.900634765625, -2.766387939453125, -2.63214111328125, -2.497894287109375, -2.3636474609375, -2.229400634765625, -2.09515380859375, -1.960906982421875, -1.82666015625, -1.692413330078125, -1.55816650390625, -1.423919677734375, -1.2896728515625, -1.155426025390625, -1.02117919921875, -0.886932373046875, -0.752685546875, -0.618438720703125, -0.48419189453125, -0.349945068359375, -0.2156982421875, -0.081451416015625, 0.05279541015625, 0.187042236328125, 0.3212890625, 0.455535888671875, 0.58978271484375, 0.724029541015625, 0.8582763671875, 0.992523193359375, 1.12677001953125, 1.261016845703125, 1.395263671875, 1.529510498046875, 1.66375732421875, 1.798004150390625, 1.9322509765625, 2.066497802734375, 2.20074462890625, 2.334991455078125, 2.46923828125, 2.603485107421875, 2.73773193359375, 2.871978759765625, 3.0062255859375, 3.140472412109375, 3.27471923828125, 3.408966064453125, 3.543212890625, 3.677459716796875, 3.81170654296875, 3.945953369140625, 4.0802001953125, 4.214447021484375, 4.34869384765625, 4.482940673828125, 4.6171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 4.0, 4.0, 3.0, 11.0, 8.0, 14.0, 12.0, 10.0, 12.0, 20.0, 19.0, 22.0, 28.0, 43.0, 46.0, 33.0, 46.0, 45.0, 63.0, 48.0, 51.0, 52.0, 63.0, 52.0, 44.0, 37.0, 26.0, 34.0, 29.0, 20.0, 22.0, 13.0, 15.0, 8.0, 9.0, 13.0, 9.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.671875, -1.61285400390625, -1.5538330078125, -1.49481201171875, -1.435791015625, -1.37677001953125, -1.3177490234375, -1.25872802734375, -1.19970703125, -1.14068603515625, -1.0816650390625, -1.02264404296875, -0.963623046875, -0.90460205078125, -0.8455810546875, -0.78656005859375, -0.7275390625, -0.66851806640625, -0.6094970703125, -0.55047607421875, -0.491455078125, -0.43243408203125, -0.3734130859375, -0.31439208984375, -0.25537109375, -0.19635009765625, -0.1373291015625, -0.07830810546875, -0.019287109375, 0.03973388671875, 0.0987548828125, 0.15777587890625, 0.216796875, 0.27581787109375, 0.3348388671875, 0.39385986328125, 0.452880859375, 0.51190185546875, 0.5709228515625, 0.62994384765625, 0.68896484375, 0.74798583984375, 0.8070068359375, 0.86602783203125, 0.925048828125, 0.98406982421875, 1.0430908203125, 1.10211181640625, 1.1611328125, 1.22015380859375, 1.2791748046875, 1.33819580078125, 1.397216796875, 1.45623779296875, 1.5152587890625, 1.57427978515625, 1.63330078125, 1.69232177734375, 1.7513427734375, 1.81036376953125, 1.869384765625, 1.92840576171875, 1.9874267578125, 2.04644775390625, 2.10546875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 13.0, 14.0, 37.0, 121.0, 318.0, 272.0, 106.0, 23.0, 16.0, 15.0, 9.0, 7.0, 2.0, 6.0, 3.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.59197998046875, -153.92050170898438, -150.24903869628906, -146.5775604248047, -142.90609741210938, -139.234619140625, -135.5631561279297, -131.8916778564453, -128.22021484375, -124.54874420166016, -120.87727355957031, -117.20580291748047, -113.53433227539062, -109.86286163330078, -106.19139099121094, -102.51991271972656, -98.84844207763672, -95.17697143554688, -91.50550079345703, -87.83403015136719, -84.16255950927734, -80.4910888671875, -76.81961059570312, -73.14814758300781, -69.47666931152344, -65.8051986694336, -62.13372802734375, -58.462257385253906, -54.79078674316406, -51.11931610107422, -47.44784164428711, -43.776371002197266, -40.10490417480469, -36.433433532714844, -32.761962890625, -29.090490341186523, -25.41901969909668, -21.747549057006836, -18.07607650756836, -14.404605865478516, -10.733135223388672, -7.06166410446167, -3.390192985534668, 0.2812786102294922, 3.952749252319336, 7.62421989440918, 11.295692443847656, 14.9671630859375, 18.638633728027344, 22.310104370117188, 25.98157501220703, 29.653047561645508, 33.32451629638672, 36.99598693847656, 40.66746139526367, 44.338932037353516, 48.01040267944336, 51.6818733215332, 55.35334396362305, 59.024818420410156, 62.6962890625, 66.36775970458984, 70.03923034667969, 73.71070098876953, 77.38217163085938]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 10.0, 15.0, 24.0, 45.0, 73.0, 121.0, 147.0, 172.0, 131.0, 86.0, 50.0, 35.0, 16.0, 4.0, 12.0, 10.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-83.10597229003906, -80.67865753173828, -78.2513427734375, -75.82402801513672, -73.39671325683594, -70.96940612792969, -68.54208374023438, -66.11477661132812, -63.687461853027344, -61.26014709472656, -58.83283233642578, -56.405517578125, -53.978206634521484, -51.5508918762207, -49.12357711791992, -46.696266174316406, -44.26894760131836, -41.84163284301758, -39.4143180847168, -36.98700714111328, -34.5596923828125, -32.13237762451172, -29.705062866210938, -27.27775001525879, -24.850435256958008, -22.423120498657227, -19.995807647705078, -17.568492889404297, -15.141179084777832, -12.713865280151367, -10.286550521850586, -7.8592376708984375, -5.431922912597656, -3.0046088695526123, -0.5772948265075684, 1.8500194549560547, 4.2773332595825195, 6.704647064208984, 9.131961822509766, 11.559274673461914, 13.986589431762695, 16.413904190063477, 18.841217041015625, 21.268531799316406, 23.695846557617188, 26.123159408569336, 28.550474166870117, 30.977787017822266, 33.40510177612305, 35.83241653442383, 38.25973129272461, 40.687042236328125, 43.114356994628906, 45.54167175292969, 47.96898651123047, 50.39630126953125, 52.82361602783203, 55.25093078613281, 57.678245544433594, 60.105560302734375, 62.53287124633789, 64.96018981933594, 67.38749694824219, 69.81481170654297, 72.24212646484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 7.0, 7.0, 11.0, 6.0, 15.0, 23.0, 28.0, 40.0, 47.0, 83.0, 106.0, 168.0, 262.0, 394.0, 664.0, 1203.0, 2230.0, 4730.0, 12543.0, 40005.0, 209370.0, 3663699.0, 197786.0, 38761.0, 11980.0, 4759.0, 2212.0, 1223.0, 663.0, 377.0, 289.0, 177.0, 124.0, 86.0, 44.0, 40.0, 34.0, 19.0, 15.0, 16.0, 7.0, 8.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15625, -19.51611328125, -18.8759765625, -18.23583984375, -17.595703125, -16.95556640625, -16.3154296875, -15.67529296875, -15.03515625, -14.39501953125, -13.7548828125, -13.11474609375, -12.474609375, -11.83447265625, -11.1943359375, -10.55419921875, -9.9140625, -9.27392578125, -8.6337890625, -7.99365234375, -7.353515625, -6.71337890625, -6.0732421875, -5.43310546875, -4.79296875, -4.15283203125, -3.5126953125, -2.87255859375, -2.232421875, -1.59228515625, -0.9521484375, -0.31201171875, 0.328125, 0.96826171875, 1.6083984375, 2.24853515625, 2.888671875, 3.52880859375, 4.1689453125, 4.80908203125, 5.44921875, 6.08935546875, 6.7294921875, 7.36962890625, 8.009765625, 8.64990234375, 9.2900390625, 9.93017578125, 10.5703125, 11.21044921875, 11.8505859375, 12.49072265625, 13.130859375, 13.77099609375, 14.4111328125, 15.05126953125, 15.69140625, 16.33154296875, 16.9716796875, 17.61181640625, 18.251953125, 18.89208984375, 19.5322265625, 20.17236328125, 20.8125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 14.0, 9.0, 13.0, 18.0, 32.0, 34.0, 50.0, 75.0, 64.0, 78.0, 83.0, 106.0, 78.0, 89.0, 59.0, 47.0, 37.0, 22.0, 22.0, 18.0, 11.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80859375, -0.7841110229492188, -0.7596282958984375, -0.7351455688476562, -0.710662841796875, -0.6861801147460938, -0.6616973876953125, -0.6372146606445312, -0.61273193359375, -0.5882492065429688, -0.5637664794921875, -0.5392837524414062, -0.514801025390625, -0.49031829833984375, -0.4658355712890625, -0.44135284423828125, -0.4168701171875, -0.39238739013671875, -0.3679046630859375, -0.34342193603515625, -0.318939208984375, -0.29445648193359375, -0.2699737548828125, -0.24549102783203125, -0.22100830078125, -0.19652557373046875, -0.1720428466796875, -0.14756011962890625, -0.123077392578125, -0.09859466552734375, -0.0741119384765625, -0.04962921142578125, -0.025146484375, -0.00066375732421875, 0.0238189697265625, 0.04830169677734375, 0.072784423828125, 0.09726715087890625, 0.1217498779296875, 0.14623260498046875, 0.17071533203125, 0.19519805908203125, 0.2196807861328125, 0.24416351318359375, 0.268646240234375, 0.29312896728515625, 0.3176116943359375, 0.34209442138671875, 0.3665771484375, 0.39105987548828125, 0.4155426025390625, 0.44002532958984375, 0.464508056640625, 0.48899078369140625, 0.5134735107421875, 0.5379562377929688, 0.56243896484375, 0.5869216918945312, 0.6114044189453125, 0.6358871459960938, 0.660369873046875, 0.6848526000976562, 0.7093353271484375, 0.7338180541992188, 0.75830078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 7.0, 7.0, 9.0, 17.0, 25.0, 42.0, 66.0, 89.0, 164.0, 302.0, 580.0, 1249.0, 2884.0, 7858.0, 27418.0, 140164.0, 2571778.0, 1292205.0, 114104.0, 23532.0, 6930.0, 2507.0, 1138.0, 517.0, 287.0, 147.0, 88.0, 55.0, 37.0, 20.0, 21.0, 8.0, 6.0, 1.0, 6.0, 7.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.546875, -18.0308837890625, -17.514892578125, -16.9989013671875, -16.48291015625, -15.9669189453125, -15.450927734375, -14.9349365234375, -14.4189453125, -13.9029541015625, -13.386962890625, -12.8709716796875, -12.35498046875, -11.8389892578125, -11.322998046875, -10.8070068359375, -10.291015625, -9.7750244140625, -9.259033203125, -8.7430419921875, -8.22705078125, -7.7110595703125, -7.195068359375, -6.6790771484375, -6.1630859375, -5.6470947265625, -5.131103515625, -4.6151123046875, -4.09912109375, -3.5831298828125, -3.067138671875, -2.5511474609375, -2.03515625, -1.5191650390625, -1.003173828125, -0.4871826171875, 0.02880859375, 0.5447998046875, 1.060791015625, 1.5767822265625, 2.0927734375, 2.6087646484375, 3.124755859375, 3.6407470703125, 4.15673828125, 4.6727294921875, 5.188720703125, 5.7047119140625, 6.220703125, 6.7366943359375, 7.252685546875, 7.7686767578125, 8.28466796875, 8.8006591796875, 9.316650390625, 9.8326416015625, 10.3486328125, 10.8646240234375, 11.380615234375, 11.8966064453125, 12.41259765625, 12.9285888671875, 13.444580078125, 13.9605712890625, 14.4765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 9.0, 9.0, 10.0, 20.0, 25.0, 43.0, 77.0, 102.0, 171.0, 291.0, 634.0, 1549.0, 480.0, 225.0, 151.0, 100.0, 49.0, 51.0, 26.0, 19.0, 9.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.35546875, -2.275177001953125, -2.19488525390625, -2.114593505859375, -2.0343017578125, -1.954010009765625, -1.87371826171875, -1.793426513671875, -1.713134765625, -1.632843017578125, -1.55255126953125, -1.472259521484375, -1.3919677734375, -1.311676025390625, -1.23138427734375, -1.151092529296875, -1.07080078125, -0.990509033203125, -0.91021728515625, -0.829925537109375, -0.7496337890625, -0.669342041015625, -0.58905029296875, -0.508758544921875, -0.428466796875, -0.348175048828125, -0.26788330078125, -0.187591552734375, -0.1072998046875, -0.027008056640625, 0.05328369140625, 0.133575439453125, 0.2138671875, 0.294158935546875, 0.37445068359375, 0.454742431640625, 0.5350341796875, 0.615325927734375, 0.69561767578125, 0.775909423828125, 0.856201171875, 0.936492919921875, 1.01678466796875, 1.097076416015625, 1.1773681640625, 1.257659912109375, 1.33795166015625, 1.418243408203125, 1.49853515625, 1.578826904296875, 1.65911865234375, 1.739410400390625, 1.8197021484375, 1.899993896484375, 1.98028564453125, 2.060577392578125, 2.140869140625, 2.221160888671875, 2.30145263671875, 2.381744384765625, 2.4620361328125, 2.542327880859375, 2.62261962890625, 2.702911376953125, 2.783203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 15.0, 35.0, 63.0, 145.0, 251.0, 254.0, 121.0, 67.0, 28.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.80404281616211, -28.002899169921875, -27.20175552368164, -26.400611877441406, -25.599468231201172, -24.798324584960938, -23.99717903137207, -23.196035385131836, -22.3948917388916, -21.593748092651367, -20.792604446411133, -19.9914608001709, -19.19031524658203, -18.389171600341797, -17.588027954101562, -16.786884307861328, -15.985740661621094, -15.18459701538086, -14.383453369140625, -13.582308769226074, -12.78116512298584, -11.980021476745605, -11.178876876831055, -10.37773323059082, -9.576589584350586, -8.775445938110352, -7.974301815032959, -7.173157691955566, -6.372014045715332, -5.570870399475098, -4.769726276397705, -3.9685821533203125, -3.167438507080078, -2.3662946224212646, -1.5651507377624512, -0.7640068531036377, 0.03713703155517578, 0.8382806777954102, 1.6394248008728027, 2.4405689239501953, 3.2417125701904297, 4.042856216430664, 4.844000339508057, 5.645144462585449, 6.446288108825684, 7.247431755065918, 8.048576354980469, 8.849720001220703, 9.650863647460938, 10.452007293701172, 11.253150939941406, 12.054295539855957, 12.855439186096191, 13.656582832336426, 14.457727432250977, 15.258871078491211, 16.060014724731445, 16.86115837097168, 17.662302017211914, 18.46344566345215, 19.264591217041016, 20.06573486328125, 20.866878509521484, 21.66802215576172, 22.469165802001953]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 4.0, 10.0, 7.0, 20.0, 19.0, 26.0, 28.0, 39.0, 44.0, 49.0, 68.0, 72.0, 86.0, 77.0, 77.0, 85.0, 58.0, 56.0, 46.0, 30.0, 23.0, 17.0, 11.0, 12.0, 9.0, 10.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.719928741455078, -7.384385108947754, -7.0488409996032715, -6.713296890258789, -6.377753257751465, -6.042209625244141, -5.706665515899658, -5.371121406555176, -5.035577774047852, -4.700034141540527, -4.364490032196045, -4.0289459228515625, -3.6934022903442383, -3.357858419418335, -3.0223145484924316, -2.6867706775665283, -2.351226806640625, -2.0156829357147217, -1.6801390647888184, -1.344595193862915, -1.0090513229370117, -0.6735074520111084, -0.3379635810852051, -0.002419710159301758, 0.33312416076660156, 0.6686680316925049, 1.0042119026184082, 1.3397557735443115, 1.6752996444702148, 2.010843515396118, 2.3463873863220215, 2.681931257247925, 3.0174760818481445, 3.353019952774048, 3.688563823699951, 4.024107933044434, 4.359651565551758, 4.695195198059082, 5.0307393074035645, 5.366283416748047, 5.701827049255371, 6.037370681762695, 6.372914791107178, 6.70845890045166, 7.044002532958984, 7.379546165466309, 7.715090274810791, 8.050634384155273, 8.386178016662598, 8.721721649169922, 9.057266235351562, 9.392809867858887, 9.728353500366211, 10.063897132873535, 10.39944076538086, 10.7349853515625, 11.070528984069824, 11.406072616577148, 11.741617202758789, 12.077160835266113, 12.412704467773438, 12.748248100280762, 13.083791732788086, 13.419336318969727, 13.75487995147705]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 3.0, 9.0, 9.0, 14.0, 17.0, 28.0, 49.0, 38.0, 130.0, 203.0, 423.0, 939.0, 2343.0, 6224.0, 18476.0, 65047.0, 287830.0, 494146.0, 124560.0, 31833.0, 9972.0, 3577.0, 1401.0, 613.0, 275.0, 152.0, 68.0, 33.0, 36.0, 24.0, 13.0, 14.0, 6.0, 10.0, 4.0, 7.0, 7.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4453125, -9.1522216796875, -8.859130859375, -8.5660400390625, -8.27294921875, -7.9798583984375, -7.686767578125, -7.3936767578125, -7.1005859375, -6.8074951171875, -6.514404296875, -6.2213134765625, -5.92822265625, -5.6351318359375, -5.342041015625, -5.0489501953125, -4.755859375, -4.4627685546875, -4.169677734375, -3.8765869140625, -3.58349609375, -3.2904052734375, -2.997314453125, -2.7042236328125, -2.4111328125, -2.1180419921875, -1.824951171875, -1.5318603515625, -1.23876953125, -0.9456787109375, -0.652587890625, -0.3594970703125, -0.06640625, 0.2266845703125, 0.519775390625, 0.8128662109375, 1.10595703125, 1.3990478515625, 1.692138671875, 1.9852294921875, 2.2783203125, 2.5714111328125, 2.864501953125, 3.1575927734375, 3.45068359375, 3.7437744140625, 4.036865234375, 4.3299560546875, 4.623046875, 4.9161376953125, 5.209228515625, 5.5023193359375, 5.79541015625, 6.0885009765625, 6.381591796875, 6.6746826171875, 6.9677734375, 7.2608642578125, 7.553955078125, 7.8470458984375, 8.14013671875, 8.4332275390625, 8.726318359375, 9.0194091796875, 9.3125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 10.0, 4.0, 11.0, 7.0, 16.0, 28.0, 28.0, 25.0, 33.0, 52.0, 62.0, 77.0, 74.0, 75.0, 93.0, 77.0, 78.0, 58.0, 45.0, 40.0, 27.0, 24.0, 13.0, 16.0, 10.0, 9.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50048828125, -0.47760009765625, -0.4547119140625, -0.43182373046875, -0.408935546875, -0.38604736328125, -0.3631591796875, -0.34027099609375, -0.3173828125, -0.29449462890625, -0.2716064453125, -0.24871826171875, -0.225830078125, -0.20294189453125, -0.1800537109375, -0.15716552734375, -0.13427734375, -0.11138916015625, -0.0885009765625, -0.06561279296875, -0.042724609375, -0.01983642578125, 0.0030517578125, 0.02593994140625, 0.048828125, 0.07171630859375, 0.0946044921875, 0.11749267578125, 0.140380859375, 0.16326904296875, 0.1861572265625, 0.20904541015625, 0.23193359375, 0.25482177734375, 0.2777099609375, 0.30059814453125, 0.323486328125, 0.34637451171875, 0.3692626953125, 0.39215087890625, 0.4150390625, 0.43792724609375, 0.4608154296875, 0.48370361328125, 0.506591796875, 0.52947998046875, 0.5523681640625, 0.57525634765625, 0.59814453125, 0.62103271484375, 0.6439208984375, 0.66680908203125, 0.689697265625, 0.71258544921875, 0.7354736328125, 0.75836181640625, 0.78125, 0.80413818359375, 0.8270263671875, 0.84991455078125, 0.872802734375, 0.89569091796875, 0.9185791015625, 0.94146728515625, 0.96435546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 6.0, 7.0, 16.0, 16.0, 16.0, 36.0, 47.0, 64.0, 126.0, 195.0, 388.0, 692.0, 1501.0, 3176.0, 7638.0, 20674.0, 65834.0, 262238.0, 485806.0, 139342.0, 38647.0, 12982.0, 4823.0, 2114.0, 1004.0, 512.0, 275.0, 127.0, 76.0, 52.0, 39.0, 25.0, 15.0, 11.0, 9.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.3203125, -6.135986328125, -5.95166015625, -5.767333984375, -5.5830078125, -5.398681640625, -5.21435546875, -5.030029296875, -4.845703125, -4.661376953125, -4.47705078125, -4.292724609375, -4.1083984375, -3.924072265625, -3.73974609375, -3.555419921875, -3.37109375, -3.186767578125, -3.00244140625, -2.818115234375, -2.6337890625, -2.449462890625, -2.26513671875, -2.080810546875, -1.896484375, -1.712158203125, -1.52783203125, -1.343505859375, -1.1591796875, -0.974853515625, -0.79052734375, -0.606201171875, -0.421875, -0.237548828125, -0.05322265625, 0.131103515625, 0.3154296875, 0.499755859375, 0.68408203125, 0.868408203125, 1.052734375, 1.237060546875, 1.42138671875, 1.605712890625, 1.7900390625, 1.974365234375, 2.15869140625, 2.343017578125, 2.52734375, 2.711669921875, 2.89599609375, 3.080322265625, 3.2646484375, 3.448974609375, 3.63330078125, 3.817626953125, 4.001953125, 4.186279296875, 4.37060546875, 4.554931640625, 4.7392578125, 4.923583984375, 5.10791015625, 5.292236328125, 5.4765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 4.0, 8.0, 4.0, 6.0, 4.0, 10.0, 8.0, 7.0, 18.0, 16.0, 19.0, 21.0, 24.0, 22.0, 31.0, 29.0, 29.0, 29.0, 31.0, 39.0, 36.0, 48.0, 42.0, 41.0, 43.0, 36.0, 37.0, 33.0, 39.0, 27.0, 33.0, 27.0, 28.0, 23.0, 19.0, 14.0, 19.0, 14.0, 15.0, 14.0, 11.0, 5.0, 8.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0], "bins": [-2.423828125, -2.35198974609375, -2.2801513671875, -2.20831298828125, -2.136474609375, -2.06463623046875, -1.9927978515625, -1.92095947265625, -1.84912109375, -1.77728271484375, -1.7054443359375, -1.63360595703125, -1.561767578125, -1.48992919921875, -1.4180908203125, -1.34625244140625, -1.2744140625, -1.20257568359375, -1.1307373046875, -1.05889892578125, -0.987060546875, -0.91522216796875, -0.8433837890625, -0.77154541015625, -0.69970703125, -0.62786865234375, -0.5560302734375, -0.48419189453125, -0.412353515625, -0.34051513671875, -0.2686767578125, -0.19683837890625, -0.125, -0.05316162109375, 0.0186767578125, 0.09051513671875, 0.162353515625, 0.23419189453125, 0.3060302734375, 0.37786865234375, 0.44970703125, 0.52154541015625, 0.5933837890625, 0.66522216796875, 0.737060546875, 0.80889892578125, 0.8807373046875, 0.95257568359375, 1.0244140625, 1.09625244140625, 1.1680908203125, 1.23992919921875, 1.311767578125, 1.38360595703125, 1.4554443359375, 1.52728271484375, 1.59912109375, 1.67095947265625, 1.7427978515625, 1.81463623046875, 1.886474609375, 1.95831298828125, 2.0301513671875, 2.10198974609375, 2.173828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 3.0, 6.0, 10.0, 12.0, 13.0, 41.0, 37.0, 45.0, 62.0, 82.0, 141.0, 201.0, 258.0, 458.0, 790.0, 1546.0, 3457.0, 9309.0, 37145.0, 283059.0, 606944.0, 78971.0, 15912.0, 5257.0, 2131.0, 1023.0, 571.0, 402.0, 229.0, 108.0, 97.0, 65.0, 40.0, 38.0, 29.0, 23.0, 10.0, 3.0, 4.0, 3.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.515625, -8.2427978515625, -7.969970703125, -7.6971435546875, -7.42431640625, -7.1514892578125, -6.878662109375, -6.6058349609375, -6.3330078125, -6.0601806640625, -5.787353515625, -5.5145263671875, -5.24169921875, -4.9688720703125, -4.696044921875, -4.4232177734375, -4.150390625, -3.8775634765625, -3.604736328125, -3.3319091796875, -3.05908203125, -2.7862548828125, -2.513427734375, -2.2406005859375, -1.9677734375, -1.6949462890625, -1.422119140625, -1.1492919921875, -0.87646484375, -0.6036376953125, -0.330810546875, -0.0579833984375, 0.21484375, 0.4876708984375, 0.760498046875, 1.0333251953125, 1.30615234375, 1.5789794921875, 1.851806640625, 2.1246337890625, 2.3974609375, 2.6702880859375, 2.943115234375, 3.2159423828125, 3.48876953125, 3.7615966796875, 4.034423828125, 4.3072509765625, 4.580078125, 4.8529052734375, 5.125732421875, 5.3985595703125, 5.67138671875, 5.9442138671875, 6.217041015625, 6.4898681640625, 6.7626953125, 7.0355224609375, 7.308349609375, 7.5811767578125, 7.85400390625, 8.1268310546875, 8.399658203125, 8.6724853515625, 8.9453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 8.0, 10.0, 22.0, 56.0, 185.0, 342.0, 234.0, 77.0, 37.0, 14.0, 12.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0019779205322265625, -0.0019325986504554749, -0.0018872767686843872, -0.0018419548869132996, -0.001796633005142212, -0.0017513111233711243, -0.0017059892416000366, -0.001660667359828949, -0.0016153454780578613, -0.0015700235962867737, -0.001524701714515686, -0.0014793798327445984, -0.0014340579509735107, -0.001388736069202423, -0.0013434141874313354, -0.0012980923056602478, -0.0012527704238891602, -0.0012074485421180725, -0.0011621266603469849, -0.0011168047785758972, -0.0010714828968048096, -0.001026161015033722, -0.0009808391332626343, -0.0009355172514915466, -0.000890195369720459, -0.0008448734879493713, -0.0007995516061782837, -0.000754229724407196, -0.0007089078426361084, -0.0006635859608650208, -0.0006182640790939331, -0.0005729421973228455, -0.0005276203155517578, -0.00048229843378067017, -0.0004369765520095825, -0.0003916546702384949, -0.0003463327884674072, -0.0003010109066963196, -0.00025568902492523193, -0.0002103671431541443, -0.00016504526138305664, -0.000119723379611969, -7.440149784088135e-05, -2.90796160697937e-05, 1.6242265701293945e-05, 6.156414747238159e-05, 0.00010688602924346924, 0.00015220791101455688, 0.00019752979278564453, 0.00024285167455673218, 0.0002881735563278198, 0.00033349543809890747, 0.0003788173198699951, 0.00042413920164108276, 0.0004694610834121704, 0.0005147829651832581, 0.0005601048469543457, 0.0006054267287254333, 0.000650748610496521, 0.0006960704922676086, 0.0007413923740386963, 0.0007867142558097839, 0.0008320361375808716, 0.0008773580193519592, 0.0009226799011230469]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 6.0, 17.0, 21.0, 51.0, 110.0, 191.0, 460.0, 1321.0, 4698.0, 28655.0, 625975.0, 363208.0, 18576.0, 3441.0, 1082.0, 376.0, 160.0, 99.0, 48.0, 27.0, 9.0, 9.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5234375, -15.0369873046875, -14.550537109375, -14.0640869140625, -13.57763671875, -13.0911865234375, -12.604736328125, -12.1182861328125, -11.6318359375, -11.1453857421875, -10.658935546875, -10.1724853515625, -9.68603515625, -9.1995849609375, -8.713134765625, -8.2266845703125, -7.740234375, -7.2537841796875, -6.767333984375, -6.2808837890625, -5.79443359375, -5.3079833984375, -4.821533203125, -4.3350830078125, -3.8486328125, -3.3621826171875, -2.875732421875, -2.3892822265625, -1.90283203125, -1.4163818359375, -0.929931640625, -0.4434814453125, 0.04296875, 0.5294189453125, 1.015869140625, 1.5023193359375, 1.98876953125, 2.4752197265625, 2.961669921875, 3.4481201171875, 3.9345703125, 4.4210205078125, 4.907470703125, 5.3939208984375, 5.88037109375, 6.3668212890625, 6.853271484375, 7.3397216796875, 7.826171875, 8.3126220703125, 8.799072265625, 9.2855224609375, 9.77197265625, 10.2584228515625, 10.744873046875, 11.2313232421875, 11.7177734375, 12.2042236328125, 12.690673828125, 13.1771240234375, 13.66357421875, 14.1500244140625, 14.636474609375, 15.1229248046875, 15.609375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 9.0, 16.0, 15.0, 11.0, 35.0, 39.0, 57.0, 75.0, 107.0, 129.0, 131.0, 99.0, 87.0, 50.0, 42.0, 26.0, 15.0, 10.0, 10.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -4.040283203125, -3.90087890625, -3.761474609375, -3.6220703125, -3.482666015625, -3.34326171875, -3.203857421875, -3.064453125, -2.925048828125, -2.78564453125, -2.646240234375, -2.5068359375, -2.367431640625, -2.22802734375, -2.088623046875, -1.94921875, -1.809814453125, -1.67041015625, -1.531005859375, -1.3916015625, -1.252197265625, -1.11279296875, -0.973388671875, -0.833984375, -0.694580078125, -0.55517578125, -0.415771484375, -0.2763671875, -0.136962890625, 0.00244140625, 0.141845703125, 0.28125, 0.420654296875, 0.56005859375, 0.699462890625, 0.8388671875, 0.978271484375, 1.11767578125, 1.257080078125, 1.396484375, 1.535888671875, 1.67529296875, 1.814697265625, 1.9541015625, 2.093505859375, 2.23291015625, 2.372314453125, 2.51171875, 2.651123046875, 2.79052734375, 2.929931640625, 3.0693359375, 3.208740234375, 3.34814453125, 3.487548828125, 3.626953125, 3.766357421875, 3.90576171875, 4.045166015625, 4.1845703125, 4.323974609375, 4.46337890625, 4.602783203125, 4.7421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 14.0, 39.0, 72.0, 154.0, 234.0, 237.0, 121.0, 63.0, 24.0, 11.0, 8.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.095191955566406, -58.200523376464844, -56.305850982666016, -54.41118240356445, -52.516510009765625, -50.62184143066406, -48.7271728515625, -46.83250045776367, -44.93783187866211, -43.04316329956055, -41.14849090576172, -39.253822326660156, -37.35914993286133, -35.464481353759766, -33.56980895996094, -31.675140380859375, -29.78046989440918, -27.885799407958984, -25.99112892150879, -24.096458435058594, -22.20178985595703, -20.307119369506836, -18.41244888305664, -16.517780303955078, -14.623108863830566, -12.728438377380371, -10.833768844604492, -8.939098358154297, -7.04442834854126, -5.149758338928223, -3.2550878524780273, -1.3604183197021484, 0.5342521667480469, 2.428922176361084, 4.323592185974121, 6.218262672424316, 8.112932205200195, 10.00760269165039, 11.902273178100586, 13.796942710876465, 15.69161319732666, 17.58628273010254, 19.480953216552734, 21.37562370300293, 23.270294189453125, 25.164962768554688, 27.059635162353516, 28.954303741455078, 30.848974227905273, 32.74364471435547, 34.63831329345703, 36.53298568725586, 38.42765426635742, 40.32232666015625, 42.21699523925781, 44.111663818359375, 46.0063362121582, 47.901004791259766, 49.795677185058594, 51.690345764160156, 53.585018157958984, 55.47968673706055, 57.374359130859375, 59.26902770996094, 61.1636962890625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 9.0, 9.0, 9.0, 17.0, 29.0, 37.0, 56.0, 93.0, 114.0, 128.0, 124.0, 102.0, 85.0, 72.0, 39.0, 26.0, 13.0, 16.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.74987030029297, -65.2035903930664, -63.657310485839844, -62.11103057861328, -60.56474685668945, -59.01846694946289, -57.47218704223633, -55.925907135009766, -54.37962341308594, -52.833343505859375, -51.28706359863281, -49.74078369140625, -48.19449996948242, -46.64822006225586, -45.1019401550293, -43.555660247802734, -42.00938034057617, -40.46310043334961, -38.91682052612305, -37.37053680419922, -35.824256896972656, -34.277976989746094, -32.73169708251953, -31.18541717529297, -29.639135360717773, -28.09285545349121, -26.546573638916016, -25.000293731689453, -23.45401382446289, -21.907732009887695, -20.361452102661133, -18.815170288085938, -17.26888656616211, -15.72260570526123, -14.176324844360352, -12.630044937133789, -11.08376407623291, -9.537483215332031, -7.991203308105469, -6.44492244720459, -4.898641586303711, -3.352360963821411, -1.8060803413391113, -0.2597999572753906, 1.2864809036254883, 2.832761764526367, 4.37904167175293, 5.925322532653809, 7.4716033935546875, 9.017884254455566, 10.564165115356445, 12.110445022583008, 13.656725883483887, 15.203006744384766, 16.749286651611328, 18.29556655883789, 19.841848373413086, 21.38812828063965, 22.934410095214844, 24.480690002441406, 26.02696990966797, 27.573251724243164, 29.119531631469727, 30.665813446044922, 32.212093353271484]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 10.0, 11.0, 17.0, 13.0, 23.0, 18.0, 18.0, 24.0, 45.0, 43.0, 66.0, 119.0, 157.0, 318.0, 570.0, 1188.0, 2494.0, 5887.0, 15898.0, 55828.0, 472342.0, 3502374.0, 98632.0, 23247.0, 8085.0, 3339.0, 1662.0, 799.0, 384.0, 268.0, 140.0, 92.0, 58.0, 31.0, 33.0, 12.0, 6.0, 8.0, 5.0, 1.0, 3.0, 2.0], "bins": [-25.640625, -25.0467529296875, -24.452880859375, -23.8590087890625, -23.26513671875, -22.6712646484375, -22.077392578125, -21.4835205078125, -20.8896484375, -20.2957763671875, -19.701904296875, -19.1080322265625, -18.51416015625, -17.9202880859375, -17.326416015625, -16.7325439453125, -16.138671875, -15.5447998046875, -14.950927734375, -14.3570556640625, -13.76318359375, -13.1693115234375, -12.575439453125, -11.9815673828125, -11.3876953125, -10.7938232421875, -10.199951171875, -9.6060791015625, -9.01220703125, -8.4183349609375, -7.824462890625, -7.2305908203125, -6.63671875, -6.0428466796875, -5.448974609375, -4.8551025390625, -4.26123046875, -3.6673583984375, -3.073486328125, -2.4796142578125, -1.8857421875, -1.2918701171875, -0.697998046875, -0.1041259765625, 0.48974609375, 1.0836181640625, 1.677490234375, 2.2713623046875, 2.865234375, 3.4591064453125, 4.052978515625, 4.6468505859375, 5.24072265625, 5.8345947265625, 6.428466796875, 7.0223388671875, 7.6162109375, 8.2100830078125, 8.803955078125, 9.3978271484375, 9.99169921875, 10.5855712890625, 11.179443359375, 11.7733154296875, 12.3671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 2.0, 5.0, 15.0, 23.0, 26.0, 36.0, 51.0, 53.0, 68.0, 83.0, 105.0, 96.0, 104.0, 79.0, 67.0, 58.0, 41.0, 25.0, 20.0, 18.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.11328125, -1.0841827392578125, -1.055084228515625, -1.0259857177734375, -0.99688720703125, -0.9677886962890625, -0.938690185546875, -0.9095916748046875, -0.8804931640625, -0.8513946533203125, -0.822296142578125, -0.7931976318359375, -0.76409912109375, -0.7350006103515625, -0.705902099609375, -0.6768035888671875, -0.647705078125, -0.6186065673828125, -0.589508056640625, -0.5604095458984375, -0.53131103515625, -0.5022125244140625, -0.473114013671875, -0.4440155029296875, -0.4149169921875, -0.3858184814453125, -0.356719970703125, -0.3276214599609375, -0.29852294921875, -0.2694244384765625, -0.240325927734375, -0.2112274169921875, -0.18212890625, -0.1530303955078125, -0.123931884765625, -0.0948333740234375, -0.06573486328125, -0.0366363525390625, -0.007537841796875, 0.0215606689453125, 0.0506591796875, 0.0797576904296875, 0.108856201171875, 0.1379547119140625, 0.16705322265625, 0.1961517333984375, 0.225250244140625, 0.2543487548828125, 0.283447265625, 0.3125457763671875, 0.341644287109375, 0.3707427978515625, 0.39984130859375, 0.4289398193359375, 0.458038330078125, 0.4871368408203125, 0.5162353515625, 0.5453338623046875, 0.574432373046875, 0.6035308837890625, 0.63262939453125, 0.6617279052734375, 0.690826416015625, 0.7199249267578125, 0.7490234375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 5.0, 8.0, 9.0, 7.0, 12.0, 18.0, 16.0, 19.0, 28.0, 50.0, 103.0, 107.0, 235.0, 495.0, 1201.0, 3448.0, 13301.0, 71063.0, 875539.0, 3093012.0, 109327.0, 18882.0, 4655.0, 1465.0, 562.0, 265.0, 161.0, 99.0, 58.0, 38.0, 28.0, 21.0, 15.0, 8.0, 9.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.015625, -17.396728515625, -16.77783203125, -16.158935546875, -15.5400390625, -14.921142578125, -14.30224609375, -13.683349609375, -13.064453125, -12.445556640625, -11.82666015625, -11.207763671875, -10.5888671875, -9.969970703125, -9.35107421875, -8.732177734375, -8.11328125, -7.494384765625, -6.87548828125, -6.256591796875, -5.6376953125, -5.018798828125, -4.39990234375, -3.781005859375, -3.162109375, -2.543212890625, -1.92431640625, -1.305419921875, -0.6865234375, -0.067626953125, 0.55126953125, 1.170166015625, 1.7890625, 2.407958984375, 3.02685546875, 3.645751953125, 4.2646484375, 4.883544921875, 5.50244140625, 6.121337890625, 6.740234375, 7.359130859375, 7.97802734375, 8.596923828125, 9.2158203125, 9.834716796875, 10.45361328125, 11.072509765625, 11.69140625, 12.310302734375, 12.92919921875, 13.548095703125, 14.1669921875, 14.785888671875, 15.40478515625, 16.023681640625, 16.642578125, 17.261474609375, 17.88037109375, 18.499267578125, 19.1181640625, 19.737060546875, 20.35595703125, 20.974853515625, 21.59375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 11.0, 13.0, 10.0, 22.0, 26.0, 35.0, 40.0, 50.0, 71.0, 87.0, 136.0, 210.0, 372.0, 1331.0, 693.0, 300.0, 184.0, 103.0, 65.0, 70.0, 41.0, 37.0, 35.0, 31.0, 13.0, 21.0, 14.0, 12.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.482421875, -1.4291839599609375, -1.375946044921875, -1.3227081298828125, -1.26947021484375, -1.2162322998046875, -1.162994384765625, -1.1097564697265625, -1.0565185546875, -1.0032806396484375, -0.950042724609375, -0.8968048095703125, -0.84356689453125, -0.7903289794921875, -0.737091064453125, -0.6838531494140625, -0.630615234375, -0.5773773193359375, -0.524139404296875, -0.4709014892578125, -0.41766357421875, -0.3644256591796875, -0.311187744140625, -0.2579498291015625, -0.2047119140625, -0.1514739990234375, -0.098236083984375, -0.0449981689453125, 0.00823974609375, 0.0614776611328125, 0.114715576171875, 0.1679534912109375, 0.22119140625, 0.2744293212890625, 0.327667236328125, 0.3809051513671875, 0.43414306640625, 0.4873809814453125, 0.540618896484375, 0.5938568115234375, 0.6470947265625, 0.7003326416015625, 0.753570556640625, 0.8068084716796875, 0.86004638671875, 0.9132843017578125, 0.966522216796875, 1.0197601318359375, 1.072998046875, 1.1262359619140625, 1.179473876953125, 1.2327117919921875, 1.28594970703125, 1.3391876220703125, 1.392425537109375, 1.4456634521484375, 1.4989013671875, 1.5521392822265625, 1.605377197265625, 1.6586151123046875, 1.71185302734375, 1.7650909423828125, 1.818328857421875, 1.8715667724609375, 1.9248046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 11.0, 20.0, 22.0, 35.0, 39.0, 72.0, 81.0, 106.0, 113.0, 126.0, 115.0, 65.0, 68.0, 29.0, 23.0, 21.0, 12.0, 14.0, 9.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.629003524780273, -13.258279800415039, -12.887555122375488, -12.516831398010254, -12.14610767364502, -11.775382995605469, -11.404659271240234, -11.033935546875, -10.663211822509766, -10.292488098144531, -9.92176342010498, -9.551039695739746, -9.180315971374512, -8.809591293334961, -8.438867568969727, -8.068143844604492, -7.697419166564941, -7.326694965362549, -6.9559712409973145, -6.585247039794922, -6.2145233154296875, -5.843799114227295, -5.473074913024902, -5.102351188659668, -4.731626987457275, -4.360902786254883, -3.9901790618896484, -3.619454860687256, -3.2487308979034424, -2.878006935119629, -2.5072827339172363, -2.136558771133423, -1.7658357620239258, -1.3951117992401123, -1.0243877172470093, -0.6536636352539062, -0.2829396724700928, 0.0877842903137207, 0.4585084915161133, 0.8292324542999268, 1.1999564170837402, 1.5706803798675537, 1.9414044618606567, 2.3121285438537598, 2.6828525066375732, 3.0535764694213867, 3.4243006706237793, 3.7950246334075928, 4.165748596191406, 4.536472797393799, 4.907196521759033, 5.277920722961426, 5.64864444732666, 6.019368648529053, 6.390092849731445, 6.76081657409668, 7.131540775299072, 7.502264976501465, 7.872988700866699, 8.24371337890625, 8.614437103271484, 8.985160827636719, 9.355884552001953, 9.726609230041504, 10.097332954406738]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 8.0, 13.0, 11.0, 20.0, 26.0, 37.0, 40.0, 54.0, 62.0, 78.0, 94.0, 107.0, 97.0, 74.0, 64.0, 62.0, 57.0, 28.0, 28.0, 21.0, 4.0, 11.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.148794174194336, -7.771350860595703, -7.3939080238342285, -7.016464710235596, -6.639021873474121, -6.261578559875488, -5.8841352462768555, -5.506691932678223, -5.129249095916748, -4.751805782318115, -4.374362945556641, -3.996919631958008, -3.619476556777954, -3.2420334815979004, -2.8645901679992676, -2.487147092819214, -2.10970401763916, -1.7322609424591064, -1.3548177480697632, -0.9773745536804199, -0.5999314785003662, -0.2224884033203125, 0.1549549102783203, 0.532397985458374, 0.9098410606384277, 1.2872841358184814, 1.6647273302078247, 2.042170524597168, 2.4196135997772217, 2.7970566749572754, 3.174499988555908, 3.551943063735962, 3.9293861389160156, 4.306829452514648, 4.684272289276123, 5.061715602874756, 5.4391584396362305, 5.816601753234863, 6.194045066833496, 6.571488380432129, 6.9489312171936035, 7.326374530792236, 7.703817367553711, 8.081260681152344, 8.458703994750977, 8.83614730834961, 9.213590621948242, 9.591032981872559, 9.968476295471191, 10.345919609069824, 10.723362922668457, 11.100805282592773, 11.478248596191406, 11.855691909790039, 12.233135223388672, 12.610578536987305, 12.988021850585938, 13.36546516418457, 13.742908477783203, 14.120351791381836, 14.497794151306152, 14.875237464904785, 15.252680778503418, 15.63012409210205, 16.007566452026367]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 10.0, 11.0, 26.0, 28.0, 45.0, 63.0, 107.0, 138.0, 210.0, 473.0, 756.0, 1245.0, 2383.0, 4601.0, 9067.0, 19114.0, 42414.0, 98154.0, 214601.0, 305201.0, 191964.0, 86757.0, 37034.0, 16891.0, 8033.0, 4099.0, 2248.0, 1205.0, 647.0, 385.0, 234.0, 131.0, 81.0, 61.0, 34.0, 28.0, 20.0, 7.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.6904296875, -4.525390625, -4.3603515625, -4.1953125, -4.0302734375, -3.865234375, -3.7001953125, -3.53515625, -3.3701171875, -3.205078125, -3.0400390625, -2.875, -2.7099609375, -2.544921875, -2.3798828125, -2.21484375, -2.0498046875, -1.884765625, -1.7197265625, -1.5546875, -1.3896484375, -1.224609375, -1.0595703125, -0.89453125, -0.7294921875, -0.564453125, -0.3994140625, -0.234375, -0.0693359375, 0.095703125, 0.2607421875, 0.42578125, 0.5908203125, 0.755859375, 0.9208984375, 1.0859375, 1.2509765625, 1.416015625, 1.5810546875, 1.74609375, 1.9111328125, 2.076171875, 2.2412109375, 2.40625, 2.5712890625, 2.736328125, 2.9013671875, 3.06640625, 3.2314453125, 3.396484375, 3.5615234375, 3.7265625, 3.8916015625, 4.056640625, 4.2216796875, 4.38671875, 4.5517578125, 4.716796875, 4.8818359375, 5.046875, 5.2119140625, 5.376953125, 5.5419921875, 5.70703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 8.0, 8.0, 8.0, 5.0, 10.0, 14.0, 20.0, 15.0, 16.0, 38.0, 25.0, 41.0, 32.0, 50.0, 61.0, 41.0, 53.0, 52.0, 53.0, 53.0, 50.0, 44.0, 50.0, 31.0, 33.0, 29.0, 22.0, 25.0, 25.0, 13.0, 15.0, 10.0, 7.0, 7.0, 4.0, 3.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44091796875, -0.42612457275390625, -0.4113311767578125, -0.39653778076171875, -0.381744384765625, -0.36695098876953125, -0.3521575927734375, -0.33736419677734375, -0.32257080078125, -0.30777740478515625, -0.2929840087890625, -0.27819061279296875, -0.263397216796875, -0.24860382080078125, -0.2338104248046875, -0.21901702880859375, -0.2042236328125, -0.18943023681640625, -0.1746368408203125, -0.15984344482421875, -0.145050048828125, -0.13025665283203125, -0.1154632568359375, -0.10066986083984375, -0.08587646484375, -0.07108306884765625, -0.0562896728515625, -0.04149627685546875, -0.026702880859375, -0.01190948486328125, 0.0028839111328125, 0.01767730712890625, 0.032470703125, 0.04726409912109375, 0.0620574951171875, 0.07685089111328125, 0.091644287109375, 0.10643768310546875, 0.1212310791015625, 0.13602447509765625, 0.15081787109375, 0.16561126708984375, 0.1804046630859375, 0.19519805908203125, 0.209991455078125, 0.22478485107421875, 0.2395782470703125, 0.25437164306640625, 0.2691650390625, 0.28395843505859375, 0.2987518310546875, 0.31354522705078125, 0.328338623046875, 0.34313201904296875, 0.3579254150390625, 0.37271881103515625, 0.38751220703125, 0.40230560302734375, 0.4170989990234375, 0.43189239501953125, 0.446685791015625, 0.46147918701171875, 0.4762725830078125, 0.49106597900390625, 0.505859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 4.0, 10.0, 14.0, 19.0, 21.0, 12.0, 35.0, 48.0, 78.0, 87.0, 161.0, 285.0, 400.0, 684.0, 1569.0, 4677.0, 20253.0, 123772.0, 531548.0, 302360.0, 48402.0, 9136.0, 2522.0, 1054.0, 512.0, 289.0, 175.0, 128.0, 100.0, 51.0, 37.0, 32.0, 24.0, 14.0, 10.0, 9.0, 2.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.390625, -10.0633544921875, -9.736083984375, -9.4088134765625, -9.08154296875, -8.7542724609375, -8.427001953125, -8.0997314453125, -7.7724609375, -7.4451904296875, -7.117919921875, -6.7906494140625, -6.46337890625, -6.1361083984375, -5.808837890625, -5.4815673828125, -5.154296875, -4.8270263671875, -4.499755859375, -4.1724853515625, -3.84521484375, -3.5179443359375, -3.190673828125, -2.8634033203125, -2.5361328125, -2.2088623046875, -1.881591796875, -1.5543212890625, -1.22705078125, -0.8997802734375, -0.572509765625, -0.2452392578125, 0.08203125, 0.4093017578125, 0.736572265625, 1.0638427734375, 1.39111328125, 1.7183837890625, 2.045654296875, 2.3729248046875, 2.7001953125, 3.0274658203125, 3.354736328125, 3.6820068359375, 4.00927734375, 4.3365478515625, 4.663818359375, 4.9910888671875, 5.318359375, 5.6456298828125, 5.972900390625, 6.3001708984375, 6.62744140625, 6.9547119140625, 7.281982421875, 7.6092529296875, 7.9365234375, 8.2637939453125, 8.591064453125, 8.9183349609375, 9.24560546875, 9.5728759765625, 9.900146484375, 10.2274169921875, 10.5546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 6.0, 9.0, 8.0, 6.0, 12.0, 14.0, 11.0, 15.0, 22.0, 17.0, 22.0, 26.0, 20.0, 40.0, 23.0, 32.0, 30.0, 37.0, 42.0, 35.0, 60.0, 49.0, 52.0, 47.0, 43.0, 43.0, 34.0, 32.0, 33.0, 28.0, 15.0, 25.0, 16.0, 20.0, 19.0, 10.0, 9.0, 5.0, 9.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.482421875, -2.39593505859375, -2.3094482421875, -2.22296142578125, -2.136474609375, -2.04998779296875, -1.9635009765625, -1.87701416015625, -1.79052734375, -1.70404052734375, -1.6175537109375, -1.53106689453125, -1.444580078125, -1.35809326171875, -1.2716064453125, -1.18511962890625, -1.0986328125, -1.01214599609375, -0.9256591796875, -0.83917236328125, -0.752685546875, -0.66619873046875, -0.5797119140625, -0.49322509765625, -0.40673828125, -0.32025146484375, -0.2337646484375, -0.14727783203125, -0.060791015625, 0.02569580078125, 0.1121826171875, 0.19866943359375, 0.28515625, 0.37164306640625, 0.4581298828125, 0.54461669921875, 0.631103515625, 0.71759033203125, 0.8040771484375, 0.89056396484375, 0.97705078125, 1.06353759765625, 1.1500244140625, 1.23651123046875, 1.322998046875, 1.40948486328125, 1.4959716796875, 1.58245849609375, 1.6689453125, 1.75543212890625, 1.8419189453125, 1.92840576171875, 2.014892578125, 2.10137939453125, 2.1878662109375, 2.27435302734375, 2.36083984375, 2.44732666015625, 2.5338134765625, 2.62030029296875, 2.706787109375, 2.79327392578125, 2.8797607421875, 2.96624755859375, 3.052734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 8.0, 11.0, 17.0, 23.0, 29.0, 34.0, 51.0, 89.0, 152.0, 246.0, 462.0, 834.0, 1577.0, 3145.0, 7091.0, 16332.0, 43095.0, 131616.0, 366315.0, 313236.0, 103785.0, 34976.0, 13719.0, 5848.0, 2753.0, 1348.0, 714.0, 392.0, 225.0, 130.0, 95.0, 61.0, 50.0, 28.0, 19.0, 11.0, 10.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.4921875, -6.3006591796875, -6.109130859375, -5.9176025390625, -5.72607421875, -5.5345458984375, -5.343017578125, -5.1514892578125, -4.9599609375, -4.7684326171875, -4.576904296875, -4.3853759765625, -4.19384765625, -4.0023193359375, -3.810791015625, -3.6192626953125, -3.427734375, -3.2362060546875, -3.044677734375, -2.8531494140625, -2.66162109375, -2.4700927734375, -2.278564453125, -2.0870361328125, -1.8955078125, -1.7039794921875, -1.512451171875, -1.3209228515625, -1.12939453125, -0.9378662109375, -0.746337890625, -0.5548095703125, -0.36328125, -0.1717529296875, 0.019775390625, 0.2113037109375, 0.40283203125, 0.5943603515625, 0.785888671875, 0.9774169921875, 1.1689453125, 1.3604736328125, 1.552001953125, 1.7435302734375, 1.93505859375, 2.1265869140625, 2.318115234375, 2.5096435546875, 2.701171875, 2.8927001953125, 3.084228515625, 3.2757568359375, 3.46728515625, 3.6588134765625, 3.850341796875, 4.0418701171875, 4.2333984375, 4.4249267578125, 4.616455078125, 4.8079833984375, 4.99951171875, 5.1910400390625, 5.382568359375, 5.5740966796875, 5.765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 10.0, 15.0, 21.0, 32.0, 39.0, 48.0, 64.0, 94.0, 121.0, 117.0, 98.0, 79.0, 56.0, 53.0, 24.0, 35.0, 13.0, 12.0, 10.0, 9.0, 11.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00092315673828125, -0.0008969902992248535, -0.000870823860168457, -0.0008446574211120605, -0.0008184909820556641, -0.0007923245429992676, -0.0007661581039428711, -0.0007399916648864746, -0.0007138252258300781, -0.0006876587867736816, -0.0006614923477172852, -0.0006353259086608887, -0.0006091594696044922, -0.0005829930305480957, -0.0005568265914916992, -0.0005306601524353027, -0.0005044937133789062, -0.00047832727432250977, -0.0004521608352661133, -0.0004259943962097168, -0.0003998279571533203, -0.00037366151809692383, -0.00034749507904052734, -0.00032132863998413086, -0.0002951622009277344, -0.0002689957618713379, -0.0002428293228149414, -0.00021666288375854492, -0.00019049644470214844, -0.00016433000564575195, -0.00013816356658935547, -0.00011199712753295898, -8.58306884765625e-05, -5.9664249420166016e-05, -3.349781036376953e-05, -7.331371307373047e-06, 1.8835067749023438e-05, 4.500150680541992e-05, 7.11679458618164e-05, 9.733438491821289e-05, 0.00012350082397460938, 0.00014966726303100586, 0.00017583370208740234, 0.00020200014114379883, 0.0002281665802001953, 0.0002543330192565918, 0.0002804994583129883, 0.00030666589736938477, 0.00033283233642578125, 0.00035899877548217773, 0.0003851652145385742, 0.0004113316535949707, 0.0004374980926513672, 0.00046366453170776367, 0.0004898309707641602, 0.0005159974098205566, 0.0005421638488769531, 0.0005683302879333496, 0.0005944967269897461, 0.0006206631660461426, 0.0006468296051025391, 0.0006729960441589355, 0.000699162483215332, 0.0007253289222717285, 0.000751495361328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 5.0, 7.0, 10.0, 7.0, 23.0, 38.0, 46.0, 65.0, 96.0, 247.0, 492.0, 1276.0, 4828.0, 29458.0, 369102.0, 585773.0, 47513.0, 6703.0, 1637.0, 623.0, 249.0, 131.0, 68.0, 49.0, 38.0, 22.0, 14.0, 8.0, 2.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.015625, -14.575439453125, -14.13525390625, -13.695068359375, -13.2548828125, -12.814697265625, -12.37451171875, -11.934326171875, -11.494140625, -11.053955078125, -10.61376953125, -10.173583984375, -9.7333984375, -9.293212890625, -8.85302734375, -8.412841796875, -7.97265625, -7.532470703125, -7.09228515625, -6.652099609375, -6.2119140625, -5.771728515625, -5.33154296875, -4.891357421875, -4.451171875, -4.010986328125, -3.57080078125, -3.130615234375, -2.6904296875, -2.250244140625, -1.81005859375, -1.369873046875, -0.9296875, -0.489501953125, -0.04931640625, 0.390869140625, 0.8310546875, 1.271240234375, 1.71142578125, 2.151611328125, 2.591796875, 3.031982421875, 3.47216796875, 3.912353515625, 4.3525390625, 4.792724609375, 5.23291015625, 5.673095703125, 6.11328125, 6.553466796875, 6.99365234375, 7.433837890625, 7.8740234375, 8.314208984375, 8.75439453125, 9.194580078125, 9.634765625, 10.074951171875, 10.51513671875, 10.955322265625, 11.3955078125, 11.835693359375, 12.27587890625, 12.716064453125, 13.15625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 5.0, 7.0, 7.0, 7.0, 8.0, 13.0, 14.0, 12.0, 13.0, 29.0, 24.0, 31.0, 44.0, 34.0, 55.0, 65.0, 74.0, 85.0, 52.0, 63.0, 52.0, 47.0, 37.0, 40.0, 33.0, 21.0, 20.0, 20.0, 14.0, 11.0, 11.0, 14.0, 7.0, 12.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.716796875, -2.628936767578125, -2.54107666015625, -2.453216552734375, -2.3653564453125, -2.277496337890625, -2.18963623046875, -2.101776123046875, -2.013916015625, -1.926055908203125, -1.83819580078125, -1.750335693359375, -1.6624755859375, -1.574615478515625, -1.48675537109375, -1.398895263671875, -1.31103515625, -1.223175048828125, -1.13531494140625, -1.047454833984375, -0.9595947265625, -0.871734619140625, -0.78387451171875, -0.696014404296875, -0.608154296875, -0.520294189453125, -0.43243408203125, -0.344573974609375, -0.2567138671875, -0.168853759765625, -0.08099365234375, 0.006866455078125, 0.0947265625, 0.182586669921875, 0.27044677734375, 0.358306884765625, 0.4461669921875, 0.534027099609375, 0.62188720703125, 0.709747314453125, 0.797607421875, 0.885467529296875, 0.97332763671875, 1.061187744140625, 1.1490478515625, 1.236907958984375, 1.32476806640625, 1.412628173828125, 1.50048828125, 1.588348388671875, 1.67620849609375, 1.764068603515625, 1.8519287109375, 1.939788818359375, 2.02764892578125, 2.115509033203125, 2.203369140625, 2.291229248046875, 2.37908935546875, 2.466949462890625, 2.5548095703125, 2.642669677734375, 2.73052978515625, 2.818389892578125, 2.90625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 20.0, 52.0, 165.0, 314.0, 269.0, 112.0, 42.0, 15.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.85728454589844, -80.73849487304688, -77.61971282958984, -74.50092315673828, -71.38214111328125, -68.26335144042969, -65.14456939697266, -62.025779724121094, -58.90699768066406, -55.788211822509766, -52.66942596435547, -49.55064010620117, -46.431854248046875, -43.31306838989258, -40.19428253173828, -37.07549285888672, -33.95670700073242, -30.837921142578125, -27.719135284423828, -24.60034942626953, -21.481563568115234, -18.362777709960938, -15.243989944458008, -12.125204086303711, -9.006418228149414, -5.887632369995117, -2.768846035003662, 0.34994029998779297, 3.46872615814209, 6.587512016296387, 9.706298828125, 12.825084686279297, 15.943870544433594, 19.06265640258789, 22.181442260742188, 25.300228118896484, 28.41901397705078, 31.537799835205078, 34.656585693359375, 37.77537536621094, 40.89415740966797, 44.012943267822266, 47.13172912597656, 50.25051498413086, 53.369300842285156, 56.48808670043945, 59.60687255859375, 62.72566223144531, 65.84445190429688, 68.96324157714844, 72.08202362060547, 75.20081329345703, 78.31959533691406, 81.43838500976562, 84.55716705322266, 87.67595672607422, 90.79473876953125, 93.91352844238281, 97.03231048583984, 100.1511001586914, 103.26988220214844, 106.388671875, 109.50745391845703, 112.6262435913086, 115.74502563476562]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 9.0, 16.0, 4.0, 19.0, 24.0, 18.0, 28.0, 38.0, 38.0, 47.0, 39.0, 49.0, 57.0, 65.0, 48.0, 57.0, 55.0, 50.0, 50.0, 48.0, 43.0, 40.0, 34.0, 33.0, 16.0, 15.0, 14.0, 8.0, 9.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-30.261804580688477, -29.429311752319336, -28.596818923950195, -27.764326095581055, -26.931833267211914, -26.09933853149414, -25.266845703125, -24.43435287475586, -23.60186004638672, -22.769367218017578, -21.936874389648438, -21.104381561279297, -20.271888732910156, -19.439395904541016, -18.606903076171875, -17.7744083404541, -16.941917419433594, -16.109424591064453, -15.276931762695312, -14.444438934326172, -13.611945152282715, -12.779452323913574, -11.946959495544434, -11.114465713500977, -10.281972885131836, -9.449480056762695, -8.616987228393555, -7.784493923187256, -6.952000617980957, -6.119507789611816, -5.287014961242676, -4.454521656036377, -3.622028350830078, -2.7895352840423584, -1.9570423364639282, -1.124549388885498, -0.2920563220977783, 0.5404367446899414, 1.372929573059082, 2.205422878265381, 3.0379157066345215, 3.870408773422241, 4.702901840209961, 5.535394668579102, 6.367887496948242, 7.200380802154541, 8.032873153686523, 8.86536693572998, 9.697859764099121, 10.530352592468262, 11.362845420837402, 12.19533920288086, 13.02783203125, 13.86032485961914, 14.692817687988281, 15.525310516357422, 16.357803344726562, 17.190296173095703, 18.022789001464844, 18.855281829833984, 19.687774658203125, 20.520267486572266, 21.352760314941406, 22.18525505065918, 23.01774787902832]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 6.0, 12.0, 10.0, 13.0, 15.0, 29.0, 29.0, 55.0, 84.0, 177.0, 474.0, 1673.0, 9361.0, 83854.0, 3887680.0, 191318.0, 15855.0, 2554.0, 596.0, 191.0, 88.0, 52.0, 39.0, 28.0, 21.0, 14.0, 10.0, 6.0, 6.0, 11.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.75, -23.9677734375, -23.185546875, -22.4033203125, -21.62109375, -20.8388671875, -20.056640625, -19.2744140625, -18.4921875, -17.7099609375, -16.927734375, -16.1455078125, -15.36328125, -14.5810546875, -13.798828125, -13.0166015625, -12.234375, -11.4521484375, -10.669921875, -9.8876953125, -9.10546875, -8.3232421875, -7.541015625, -6.7587890625, -5.9765625, -5.1943359375, -4.412109375, -3.6298828125, -2.84765625, -2.0654296875, -1.283203125, -0.5009765625, 0.28125, 1.0634765625, 1.845703125, 2.6279296875, 3.41015625, 4.1923828125, 4.974609375, 5.7568359375, 6.5390625, 7.3212890625, 8.103515625, 8.8857421875, 9.66796875, 10.4501953125, 11.232421875, 12.0146484375, 12.796875, 13.5791015625, 14.361328125, 15.1435546875, 15.92578125, 16.7080078125, 17.490234375, 18.2724609375, 19.0546875, 19.8369140625, 20.619140625, 21.4013671875, 22.18359375, 22.9658203125, 23.748046875, 24.5302734375, 25.3125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 4.0, 7.0, 11.0, 9.0, 20.0, 25.0, 22.0, 30.0, 34.0, 41.0, 47.0, 51.0, 51.0, 55.0, 53.0, 56.0, 65.0, 52.0, 51.0, 49.0, 55.0, 34.0, 44.0, 25.0, 21.0, 15.0, 12.0, 8.0, 6.0, 8.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6770706176757812, -0.6554107666015625, -0.6337509155273438, -0.612091064453125, -0.5904312133789062, -0.5687713623046875, -0.5471115112304688, -0.52545166015625, -0.5037918090820312, -0.4821319580078125, -0.46047210693359375, -0.438812255859375, -0.41715240478515625, -0.3954925537109375, -0.37383270263671875, -0.3521728515625, -0.33051300048828125, -0.3088531494140625, -0.28719329833984375, -0.265533447265625, -0.24387359619140625, -0.2222137451171875, -0.20055389404296875, -0.17889404296875, -0.15723419189453125, -0.1355743408203125, -0.11391448974609375, -0.092254638671875, -0.07059478759765625, -0.0489349365234375, -0.02727508544921875, -0.005615234375, 0.01604461669921875, 0.0377044677734375, 0.05936431884765625, 0.081024169921875, 0.10268402099609375, 0.1243438720703125, 0.14600372314453125, 0.16766357421875, 0.18932342529296875, 0.2109832763671875, 0.23264312744140625, 0.254302978515625, 0.27596282958984375, 0.2976226806640625, 0.31928253173828125, 0.3409423828125, 0.36260223388671875, 0.3842620849609375, 0.40592193603515625, 0.427581787109375, 0.44924163818359375, 0.4709014892578125, 0.49256134033203125, 0.51422119140625, 0.5358810424804688, 0.5575408935546875, 0.5792007446289062, 0.600860595703125, 0.6225204467773438, 0.6441802978515625, 0.6658401489257812, 0.6875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 2.0, 1.0, 7.0, 13.0, 19.0, 30.0, 52.0, 71.0, 103.0, 231.0, 414.0, 937.0, 2835.0, 10521.0, 53188.0, 454840.0, 3444234.0, 188032.0, 28805.0, 6365.0, 1926.0, 737.0, 388.0, 200.0, 119.0, 76.0, 54.0, 27.0, 23.0, 14.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.5, -15.955810546875, -15.41162109375, -14.867431640625, -14.3232421875, -13.779052734375, -13.23486328125, -12.690673828125, -12.146484375, -11.602294921875, -11.05810546875, -10.513916015625, -9.9697265625, -9.425537109375, -8.88134765625, -8.337158203125, -7.79296875, -7.248779296875, -6.70458984375, -6.160400390625, -5.6162109375, -5.072021484375, -4.52783203125, -3.983642578125, -3.439453125, -2.895263671875, -2.35107421875, -1.806884765625, -1.2626953125, -0.718505859375, -0.17431640625, 0.369873046875, 0.9140625, 1.458251953125, 2.00244140625, 2.546630859375, 3.0908203125, 3.635009765625, 4.17919921875, 4.723388671875, 5.267578125, 5.811767578125, 6.35595703125, 6.900146484375, 7.4443359375, 7.988525390625, 8.53271484375, 9.076904296875, 9.62109375, 10.165283203125, 10.70947265625, 11.253662109375, 11.7978515625, 12.342041015625, 12.88623046875, 13.430419921875, 13.974609375, 14.518798828125, 15.06298828125, 15.607177734375, 16.1513671875, 16.695556640625, 17.23974609375, 17.783935546875, 18.328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 6.0, 8.0, 5.0, 16.0, 17.0, 28.0, 21.0, 44.0, 58.0, 94.0, 139.0, 245.0, 443.0, 1516.0, 640.0, 246.0, 156.0, 113.0, 73.0, 56.0, 40.0, 27.0, 21.0, 25.0, 9.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.705078125, -1.62994384765625, -1.5548095703125, -1.47967529296875, -1.404541015625, -1.32940673828125, -1.2542724609375, -1.17913818359375, -1.10400390625, -1.02886962890625, -0.9537353515625, -0.87860107421875, -0.803466796875, -0.72833251953125, -0.6531982421875, -0.57806396484375, -0.5029296875, -0.42779541015625, -0.3526611328125, -0.27752685546875, -0.202392578125, -0.12725830078125, -0.0521240234375, 0.02301025390625, 0.09814453125, 0.17327880859375, 0.2484130859375, 0.32354736328125, 0.398681640625, 0.47381591796875, 0.5489501953125, 0.62408447265625, 0.69921875, 0.77435302734375, 0.8494873046875, 0.92462158203125, 0.999755859375, 1.07489013671875, 1.1500244140625, 1.22515869140625, 1.30029296875, 1.37542724609375, 1.4505615234375, 1.52569580078125, 1.600830078125, 1.67596435546875, 1.7510986328125, 1.82623291015625, 1.9013671875, 1.97650146484375, 2.0516357421875, 2.12677001953125, 2.201904296875, 2.27703857421875, 2.3521728515625, 2.42730712890625, 2.50244140625, 2.57757568359375, 2.6527099609375, 2.72784423828125, 2.802978515625, 2.87811279296875, 2.9532470703125, 3.02838134765625, 3.103515625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 22.0, 37.0, 59.0, 88.0, 115.0, 184.0, 157.0, 105.0, 78.0, 51.0, 25.0, 31.0, 15.0, 13.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.640647888183594, -22.01165771484375, -21.38266944885254, -20.753679275512695, -20.124691009521484, -19.49570083618164, -18.86671257019043, -18.237722396850586, -17.608734130859375, -16.97974395751953, -16.35075569152832, -15.721766471862793, -15.092777252197266, -14.463788032531738, -13.834798812866211, -13.205808639526367, -12.57681941986084, -11.947830200195312, -11.318840980529785, -10.689851760864258, -10.06086254119873, -9.431873321533203, -8.80288314819336, -8.173894882202148, -7.544905185699463, -6.9159159660339355, -6.286926746368408, -5.657937049865723, -5.028947830200195, -4.399958610534668, -3.7709693908691406, -3.1419801712036133, -2.512990951538086, -1.8840017318725586, -1.2550123929977417, -0.6260230541229248, 0.002966165542602539, 0.6319553852081299, 1.2609448432922363, 1.8899340629577637, 2.518923282623291, 3.1479125022888184, 3.7769017219543457, 4.405891418457031, 5.034880638122559, 5.663869857788086, 6.292859077453613, 6.921848297119141, 7.550837516784668, 8.179826736450195, 8.808815956115723, 9.43780517578125, 10.066794395446777, 10.695783615112305, 11.324773788452148, 11.95376205444336, 12.582752227783203, 13.21174144744873, 13.840730667114258, 14.469719886779785, 15.098709106445312, 15.72769832611084, 16.356687545776367, 16.98567771911621, 17.614665985107422]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 7.0, 7.0, 8.0, 11.0, 19.0, 21.0, 19.0, 16.0, 26.0, 26.0, 26.0, 31.0, 45.0, 35.0, 39.0, 36.0, 37.0, 44.0, 38.0, 36.0, 44.0, 42.0, 35.0, 37.0, 33.0, 34.0, 34.0, 27.0, 17.0, 32.0, 23.0, 11.0, 14.0, 19.0, 11.0, 10.0, 5.0, 5.0, 10.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-7.466585159301758, -7.247486591339111, -7.028387546539307, -6.80928897857666, -6.5901899337768555, -6.371091365814209, -6.1519927978515625, -5.932893753051758, -5.713794708251953, -5.494696140289307, -5.275597095489502, -5.0564985275268555, -4.837399482727051, -4.618300914764404, -4.399202346801758, -4.180103302001953, -3.9610047340393066, -3.741905927658081, -3.5228071212768555, -3.303708553314209, -3.0846095085144043, -2.865510940551758, -2.6464121341705322, -2.4273133277893066, -2.208214521408081, -1.9891157150268555, -1.7700169086456299, -1.5509182214736938, -1.3318194150924683, -1.1127206087112427, -0.8936219215393066, -0.674523115158081, -0.45542430877685547, -0.23632553219795227, -0.017226755619049072, 0.20187199115753174, 0.4209707975387573, 0.6400696039199829, 0.859168291091919, 1.0782670974731445, 1.2973659038543701, 1.5164647102355957, 1.7355635166168213, 1.9546622037887573, 2.1737608909606934, 2.392859935760498, 2.6119585037231445, 2.83105731010437, 3.0501561164855957, 3.2692549228668213, 3.488353729248047, 3.7074522972106934, 3.926551342010498, 4.1456499099731445, 4.364748954772949, 4.583847522735596, 4.802946090698242, 5.022044658660889, 5.241143703460693, 5.46024227142334, 5.6793413162231445, 5.898439884185791, 6.1175384521484375, 6.336637496948242, 6.555736541748047]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 13.0, 12.0, 18.0, 32.0, 28.0, 49.0, 83.0, 118.0, 172.0, 246.0, 417.0, 729.0, 1177.0, 2121.0, 3817.0, 6980.0, 13839.0, 27172.0, 54818.0, 108792.0, 198948.0, 258512.0, 178245.0, 95197.0, 47088.0, 23755.0, 11877.0, 6192.0, 3409.0, 1832.0, 1073.0, 699.0, 401.0, 214.0, 157.0, 97.0, 62.0, 42.0, 40.0, 24.0, 15.0, 23.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.296875, -4.16424560546875, -4.0316162109375, -3.89898681640625, -3.766357421875, -3.63372802734375, -3.5010986328125, -3.36846923828125, -3.23583984375, -3.10321044921875, -2.9705810546875, -2.83795166015625, -2.705322265625, -2.57269287109375, -2.4400634765625, -2.30743408203125, -2.1748046875, -2.04217529296875, -1.9095458984375, -1.77691650390625, -1.644287109375, -1.51165771484375, -1.3790283203125, -1.24639892578125, -1.11376953125, -0.98114013671875, -0.8485107421875, -0.71588134765625, -0.583251953125, -0.45062255859375, -0.3179931640625, -0.18536376953125, -0.052734375, 0.07989501953125, 0.2125244140625, 0.34515380859375, 0.477783203125, 0.61041259765625, 0.7430419921875, 0.87567138671875, 1.00830078125, 1.14093017578125, 1.2735595703125, 1.40618896484375, 1.538818359375, 1.67144775390625, 1.8040771484375, 1.93670654296875, 2.0693359375, 2.20196533203125, 2.3345947265625, 2.46722412109375, 2.599853515625, 2.73248291015625, 2.8651123046875, 2.99774169921875, 3.13037109375, 3.26300048828125, 3.3956298828125, 3.52825927734375, 3.660888671875, 3.79351806640625, 3.9261474609375, 4.05877685546875, 4.19140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 11.0, 12.0, 14.0, 26.0, 25.0, 33.0, 29.0, 43.0, 50.0, 57.0, 44.0, 55.0, 63.0, 78.0, 69.0, 69.0, 53.0, 73.0, 27.0, 36.0, 22.0, 33.0, 21.0, 16.0, 13.0, 12.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8427734375, -0.8172683715820312, -0.7917633056640625, -0.7662582397460938, -0.740753173828125, -0.7152481079101562, -0.6897430419921875, -0.6642379760742188, -0.63873291015625, -0.6132278442382812, -0.5877227783203125, -0.5622177124023438, -0.536712646484375, -0.5112075805664062, -0.4857025146484375, -0.46019744873046875, -0.4346923828125, -0.40918731689453125, -0.3836822509765625, -0.35817718505859375, -0.332672119140625, -0.30716705322265625, -0.2816619873046875, -0.25615692138671875, -0.23065185546875, -0.20514678955078125, -0.1796417236328125, -0.15413665771484375, -0.128631591796875, -0.10312652587890625, -0.0776214599609375, -0.05211639404296875, -0.026611328125, -0.00110626220703125, 0.0243988037109375, 0.04990386962890625, 0.075408935546875, 0.10091400146484375, 0.1264190673828125, 0.15192413330078125, 0.17742919921875, 0.20293426513671875, 0.2284393310546875, 0.25394439697265625, 0.279449462890625, 0.30495452880859375, 0.3304595947265625, 0.35596466064453125, 0.3814697265625, 0.40697479248046875, 0.4324798583984375, 0.45798492431640625, 0.483489990234375, 0.5089950561523438, 0.5345001220703125, 0.5600051879882812, 0.58551025390625, 0.6110153198242188, 0.6365203857421875, 0.6620254516601562, 0.687530517578125, 0.7130355834960938, 0.7385406494140625, 0.7640457153320312, 0.78955078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 13.0, 13.0, 25.0, 29.0, 48.0, 70.0, 96.0, 140.0, 244.0, 414.0, 649.0, 1466.0, 4964.0, 29355.0, 250802.0, 621370.0, 118394.0, 14671.0, 3057.0, 1168.0, 577.0, 342.0, 210.0, 116.0, 87.0, 64.0, 50.0, 22.0, 9.0, 21.0, 14.0, 10.0, 4.0, 5.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.236083984375, -10.83935546875, -10.442626953125, -10.0458984375, -9.649169921875, -9.25244140625, -8.855712890625, -8.458984375, -8.062255859375, -7.66552734375, -7.268798828125, -6.8720703125, -6.475341796875, -6.07861328125, -5.681884765625, -5.28515625, -4.888427734375, -4.49169921875, -4.094970703125, -3.6982421875, -3.301513671875, -2.90478515625, -2.508056640625, -2.111328125, -1.714599609375, -1.31787109375, -0.921142578125, -0.5244140625, -0.127685546875, 0.26904296875, 0.665771484375, 1.0625, 1.459228515625, 1.85595703125, 2.252685546875, 2.6494140625, 3.046142578125, 3.44287109375, 3.839599609375, 4.236328125, 4.633056640625, 5.02978515625, 5.426513671875, 5.8232421875, 6.219970703125, 6.61669921875, 7.013427734375, 7.41015625, 7.806884765625, 8.20361328125, 8.600341796875, 8.9970703125, 9.393798828125, 9.79052734375, 10.187255859375, 10.583984375, 10.980712890625, 11.37744140625, 11.774169921875, 12.1708984375, 12.567626953125, 12.96435546875, 13.361083984375, 13.7578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 2.0, 10.0, 4.0, 5.0, 12.0, 13.0, 20.0, 21.0, 11.0, 21.0, 17.0, 30.0, 32.0, 23.0, 37.0, 29.0, 40.0, 28.0, 32.0, 45.0, 34.0, 37.0, 42.0, 30.0, 23.0, 37.0, 35.0, 40.0, 30.0, 26.0, 23.0, 29.0, 17.0, 25.0, 18.0, 21.0, 19.0, 11.0, 9.0, 13.0, 2.0, 5.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.6953125, -2.603851318359375, -2.51239013671875, -2.420928955078125, -2.3294677734375, -2.238006591796875, -2.14654541015625, -2.055084228515625, -1.963623046875, -1.872161865234375, -1.78070068359375, -1.689239501953125, -1.5977783203125, -1.506317138671875, -1.41485595703125, -1.323394775390625, -1.23193359375, -1.140472412109375, -1.04901123046875, -0.957550048828125, -0.8660888671875, -0.774627685546875, -0.68316650390625, -0.591705322265625, -0.500244140625, -0.408782958984375, -0.31732177734375, -0.225860595703125, -0.1343994140625, -0.042938232421875, 0.04852294921875, 0.139984130859375, 0.2314453125, 0.322906494140625, 0.41436767578125, 0.505828857421875, 0.5972900390625, 0.688751220703125, 0.78021240234375, 0.871673583984375, 0.963134765625, 1.054595947265625, 1.14605712890625, 1.237518310546875, 1.3289794921875, 1.420440673828125, 1.51190185546875, 1.603363037109375, 1.69482421875, 1.786285400390625, 1.87774658203125, 1.969207763671875, 2.0606689453125, 2.152130126953125, 2.24359130859375, 2.335052490234375, 2.426513671875, 2.517974853515625, 2.60943603515625, 2.700897216796875, 2.7923583984375, 2.883819580078125, 2.97528076171875, 3.066741943359375, 3.158203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 15.0, 18.0, 29.0, 38.0, 52.0, 82.0, 114.0, 178.0, 275.0, 566.0, 931.0, 1796.0, 3783.0, 8710.0, 22786.0, 69000.0, 206756.0, 379512.0, 231592.0, 78169.0, 25704.0, 9893.0, 4119.0, 1979.0, 969.0, 543.0, 351.0, 162.0, 137.0, 74.0, 67.0, 41.0, 29.0, 15.0, 7.0, 6.0, 11.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.922576904296875, -3.79827880859375, -3.673980712890625, -3.5496826171875, -3.425384521484375, -3.30108642578125, -3.176788330078125, -3.052490234375, -2.928192138671875, -2.80389404296875, -2.679595947265625, -2.5552978515625, -2.430999755859375, -2.30670166015625, -2.182403564453125, -2.05810546875, -1.933807373046875, -1.80950927734375, -1.685211181640625, -1.5609130859375, -1.436614990234375, -1.31231689453125, -1.188018798828125, -1.063720703125, -0.939422607421875, -0.81512451171875, -0.690826416015625, -0.5665283203125, -0.442230224609375, -0.31793212890625, -0.193634033203125, -0.0693359375, 0.054962158203125, 0.17926025390625, 0.303558349609375, 0.4278564453125, 0.552154541015625, 0.67645263671875, 0.800750732421875, 0.925048828125, 1.049346923828125, 1.17364501953125, 1.297943115234375, 1.4222412109375, 1.546539306640625, 1.67083740234375, 1.795135498046875, 1.91943359375, 2.043731689453125, 2.16802978515625, 2.292327880859375, 2.4166259765625, 2.540924072265625, 2.66522216796875, 2.789520263671875, 2.913818359375, 3.038116455078125, 3.16241455078125, 3.286712646484375, 3.4110107421875, 3.535308837890625, 3.65960693359375, 3.783905029296875, 3.908203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 8.0, 12.0, 11.0, 14.0, 20.0, 26.0, 40.0, 42.0, 74.0, 56.0, 79.0, 76.0, 91.0, 81.0, 68.0, 67.0, 53.0, 38.0, 24.0, 30.0, 24.0, 10.0, 9.0, 6.0, 5.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004622936248779297, -0.00044478848576545715, -0.0004272833466529846, -0.0004097782075405121, -0.00039227306842803955, -0.000374767929315567, -0.0003572627902030945, -0.00033975765109062195, -0.0003222525119781494, -0.0003047473728656769, -0.00028724223375320435, -0.0002697370946407318, -0.0002522319555282593, -0.00023472681641578674, -0.0002172216773033142, -0.00019971653819084167, -0.00018221139907836914, -0.0001647062599658966, -0.00014720112085342407, -0.00012969598174095154, -0.000112190842628479, -9.468570351600647e-05, -7.718056440353394e-05, -5.96754252910614e-05, -4.217028617858887e-05, -2.4665147066116333e-05, -7.160007953643799e-06, 1.0345131158828735e-05, 2.785027027130127e-05, 4.5355409383773804e-05, 6.286054849624634e-05, 8.036568760871887e-05, 9.78708267211914e-05, 0.00011537596583366394, 0.00013288110494613647, 0.000150386244058609, 0.00016789138317108154, 0.00018539652228355408, 0.0002029016613960266, 0.00022040680050849915, 0.00023791193962097168, 0.0002554170787334442, 0.00027292221784591675, 0.0002904273569583893, 0.0003079324960708618, 0.00032543763518333435, 0.0003429427742958069, 0.0003604479134082794, 0.00037795305252075195, 0.0003954581916332245, 0.000412963330745697, 0.00043046846985816956, 0.0004479736089706421, 0.0004654787480831146, 0.00048298388719558716, 0.0005004890263080597, 0.0005179941654205322, 0.0005354993045330048, 0.0005530044436454773, 0.0005705095827579498, 0.0005880147218704224, 0.0006055198609828949, 0.0006230250000953674, 0.00064053013920784, 0.0006580352783203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 7.0, 11.0, 12.0, 29.0, 38.0, 39.0, 108.0, 199.0, 353.0, 745.0, 1853.0, 6155.0, 30780.0, 304006.0, 614038.0, 74280.0, 11080.0, 2818.0, 1040.0, 440.0, 212.0, 116.0, 60.0, 43.0, 25.0, 22.0, 11.0, 3.0, 10.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.533447265625, -8.23095703125, -7.928466796875, -7.6259765625, -7.323486328125, -7.02099609375, -6.718505859375, -6.416015625, -6.113525390625, -5.81103515625, -5.508544921875, -5.2060546875, -4.903564453125, -4.60107421875, -4.298583984375, -3.99609375, -3.693603515625, -3.39111328125, -3.088623046875, -2.7861328125, -2.483642578125, -2.18115234375, -1.878662109375, -1.576171875, -1.273681640625, -0.97119140625, -0.668701171875, -0.3662109375, -0.063720703125, 0.23876953125, 0.541259765625, 0.84375, 1.146240234375, 1.44873046875, 1.751220703125, 2.0537109375, 2.356201171875, 2.65869140625, 2.961181640625, 3.263671875, 3.566162109375, 3.86865234375, 4.171142578125, 4.4736328125, 4.776123046875, 5.07861328125, 5.381103515625, 5.68359375, 5.986083984375, 6.28857421875, 6.591064453125, 6.8935546875, 7.196044921875, 7.49853515625, 7.801025390625, 8.103515625, 8.406005859375, 8.70849609375, 9.010986328125, 9.3134765625, 9.615966796875, 9.91845703125, 10.220947265625, 10.5234375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 8.0, 3.0, 9.0, 19.0, 12.0, 20.0, 31.0, 30.0, 39.0, 50.0, 73.0, 76.0, 62.0, 92.0, 87.0, 72.0, 73.0, 54.0, 50.0, 29.0, 21.0, 21.0, 12.0, 16.0, 12.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.22265625, -4.12652587890625, -4.0303955078125, -3.93426513671875, -3.838134765625, -3.74200439453125, -3.6458740234375, -3.54974365234375, -3.45361328125, -3.35748291015625, -3.2613525390625, -3.16522216796875, -3.069091796875, -2.97296142578125, -2.8768310546875, -2.78070068359375, -2.6845703125, -2.58843994140625, -2.4923095703125, -2.39617919921875, -2.300048828125, -2.20391845703125, -2.1077880859375, -2.01165771484375, -1.91552734375, -1.81939697265625, -1.7232666015625, -1.62713623046875, -1.531005859375, -1.43487548828125, -1.3387451171875, -1.24261474609375, -1.146484375, -1.05035400390625, -0.9542236328125, -0.85809326171875, -0.761962890625, -0.66583251953125, -0.5697021484375, -0.47357177734375, -0.37744140625, -0.28131103515625, -0.1851806640625, -0.08905029296875, 0.007080078125, 0.10321044921875, 0.1993408203125, 0.29547119140625, 0.3916015625, 0.48773193359375, 0.5838623046875, 0.67999267578125, 0.776123046875, 0.87225341796875, 0.9683837890625, 1.06451416015625, 1.16064453125, 1.25677490234375, 1.3529052734375, 1.44903564453125, 1.545166015625, 1.64129638671875, 1.7374267578125, 1.83355712890625, 1.9296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 6.0, 5.0, 10.0, 30.0, 46.0, 82.0, 108.0, 167.0, 181.0, 131.0, 102.0, 57.0, 32.0, 15.0, 13.0, 7.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-69.88543701171875, -68.19379425048828, -66.50214385986328, -64.81050109863281, -63.11885070800781, -61.427207946777344, -59.73556137084961, -58.043914794921875, -56.35226821899414, -54.660621643066406, -52.96897506713867, -51.27732849121094, -49.58568572998047, -47.89403533935547, -46.202392578125, -44.510746002197266, -42.81909942626953, -41.1274528503418, -39.43580627441406, -37.74415969848633, -36.052513122558594, -34.360870361328125, -32.66922378540039, -30.977577209472656, -29.285930633544922, -27.594284057617188, -25.902637481689453, -24.21099281311035, -22.519346237182617, -20.827699661254883, -19.13605499267578, -17.444408416748047, -15.752761840820312, -14.061115264892578, -12.36946964263916, -10.677824020385742, -8.986177444458008, -7.294530868530273, -5.6028852462768555, -3.9112396240234375, -2.219593048095703, -0.527946949005127, 1.1636991500854492, 2.8553452491760254, 4.546991348266602, 6.238637924194336, 7.930283546447754, 9.621929168701172, 11.313575744628906, 13.00522232055664, 14.696867942810059, 16.388513565063477, 18.08016014099121, 19.771806716918945, 21.463451385498047, 23.15509796142578, 24.846744537353516, 26.53839111328125, 28.230037689208984, 29.921682357788086, 31.61332893371582, 33.30497741699219, 34.996620178222656, 36.68826675415039, 38.379913330078125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 11.0, 17.0, 13.0, 19.0, 40.0, 39.0, 40.0, 57.0, 46.0, 53.0, 69.0, 66.0, 65.0, 62.0, 56.0, 60.0, 45.0, 46.0, 43.0, 31.0, 27.0, 22.0, 19.0, 14.0, 8.0, 9.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.39739227294922, -23.33258056640625, -22.26776695251465, -21.20295524597168, -20.138141632080078, -19.07332992553711, -18.00851821899414, -16.943706512451172, -15.87889289855957, -14.814080238342285, -13.749267578125, -12.684455871582031, -11.619643211364746, -10.554830551147461, -9.490018844604492, -8.425206184387207, -7.360393524169922, -6.295580863952637, -5.23076868057251, -4.165956497192383, -3.1011438369750977, -2.0363311767578125, -0.9715189933776855, 0.0932931900024414, 1.1581058502197266, 2.2229182720184326, 3.2877306938171387, 4.352542877197266, 5.417355537414551, 6.482168197631836, 7.546980381011963, 8.61179256439209, 9.676605224609375, 10.74141788482666, 11.806230545043945, 12.871042251586914, 13.9358549118042, 15.000667572021484, 16.065479278564453, 17.130290985107422, 18.195104598999023, 19.259916305541992, 20.324729919433594, 21.389541625976562, 22.45435333251953, 23.519166946411133, 24.5839786529541, 25.648792266845703, 26.713603973388672, 27.77841567993164, 28.843229293823242, 29.90804100036621, 30.972854614257812, 32.03766632080078, 33.10247802734375, 34.16728973388672, 35.23210144042969, 36.296913146972656, 37.361724853515625, 38.42654037475586, 39.49135208129883, 40.5561637878418, 41.620975494384766, 42.685787200927734, 43.75060272216797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 14.0, 13.0, 30.0, 28.0, 51.0, 60.0, 82.0, 104.0, 177.0, 242.0, 366.0, 684.0, 1153.0, 2417.0, 5130.0, 12425.0, 36777.0, 160907.0, 3352730.0, 511934.0, 73300.0, 21152.0, 7682.0, 3185.0, 1506.0, 774.0, 490.0, 286.0, 166.0, 137.0, 77.0, 56.0, 45.0, 23.0, 20.0, 11.0, 14.0, 5.0, 7.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.6396484375, -9.326171875, -9.0126953125, -8.69921875, -8.3857421875, -8.072265625, -7.7587890625, -7.4453125, -7.1318359375, -6.818359375, -6.5048828125, -6.19140625, -5.8779296875, -5.564453125, -5.2509765625, -4.9375, -4.6240234375, -4.310546875, -3.9970703125, -3.68359375, -3.3701171875, -3.056640625, -2.7431640625, -2.4296875, -2.1162109375, -1.802734375, -1.4892578125, -1.17578125, -0.8623046875, -0.548828125, -0.2353515625, 0.078125, 0.3916015625, 0.705078125, 1.0185546875, 1.33203125, 1.6455078125, 1.958984375, 2.2724609375, 2.5859375, 2.8994140625, 3.212890625, 3.5263671875, 3.83984375, 4.1533203125, 4.466796875, 4.7802734375, 5.09375, 5.4072265625, 5.720703125, 6.0341796875, 6.34765625, 6.6611328125, 6.974609375, 7.2880859375, 7.6015625, 7.9150390625, 8.228515625, 8.5419921875, 8.85546875, 9.1689453125, 9.482421875, 9.7958984375, 10.109375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 8.0, 6.0, 8.0, 12.0, 13.0, 8.0, 20.0, 14.0, 25.0, 15.0, 22.0, 23.0, 32.0, 30.0, 29.0, 38.0, 40.0, 44.0, 34.0, 53.0, 37.0, 50.0, 43.0, 44.0, 41.0, 44.0, 32.0, 32.0, 32.0, 27.0, 24.0, 23.0, 26.0, 18.0, 20.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.623046875, -0.6031417846679688, -0.5832366943359375, -0.5633316040039062, -0.543426513671875, -0.5235214233398438, -0.5036163330078125, -0.48371124267578125, -0.46380615234375, -0.44390106201171875, -0.4239959716796875, -0.40409088134765625, -0.384185791015625, -0.36428070068359375, -0.3443756103515625, -0.32447052001953125, -0.3045654296875, -0.28466033935546875, -0.2647552490234375, -0.24485015869140625, -0.224945068359375, -0.20503997802734375, -0.1851348876953125, -0.16522979736328125, -0.14532470703125, -0.12541961669921875, -0.1055145263671875, -0.08560943603515625, -0.065704345703125, -0.04579925537109375, -0.0258941650390625, -0.00598907470703125, 0.013916015625, 0.03382110595703125, 0.0537261962890625, 0.07363128662109375, 0.093536376953125, 0.11344146728515625, 0.1333465576171875, 0.15325164794921875, 0.17315673828125, 0.19306182861328125, 0.2129669189453125, 0.23287200927734375, 0.252777099609375, 0.27268218994140625, 0.2925872802734375, 0.31249237060546875, 0.3323974609375, 0.35230255126953125, 0.3722076416015625, 0.39211273193359375, 0.412017822265625, 0.43192291259765625, 0.4518280029296875, 0.47173309326171875, 0.49163818359375, 0.5115432739257812, 0.5314483642578125, 0.5513534545898438, 0.571258544921875, 0.5911636352539062, 0.6110687255859375, 0.6309738159179688, 0.65087890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 9.0, 7.0, 14.0, 17.0, 29.0, 30.0, 47.0, 58.0, 79.0, 159.0, 397.0, 965.0, 3461.0, 15458.0, 100457.0, 3002505.0, 987510.0, 67277.0, 11552.0, 2654.0, 769.0, 335.0, 173.0, 83.0, 61.0, 40.0, 33.0, 21.0, 24.0, 18.0, 11.0, 11.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.140625, -14.680419921875, -14.22021484375, -13.760009765625, -13.2998046875, -12.839599609375, -12.37939453125, -11.919189453125, -11.458984375, -10.998779296875, -10.53857421875, -10.078369140625, -9.6181640625, -9.157958984375, -8.69775390625, -8.237548828125, -7.77734375, -7.317138671875, -6.85693359375, -6.396728515625, -5.9365234375, -5.476318359375, -5.01611328125, -4.555908203125, -4.095703125, -3.635498046875, -3.17529296875, -2.715087890625, -2.2548828125, -1.794677734375, -1.33447265625, -0.874267578125, -0.4140625, 0.046142578125, 0.50634765625, 0.966552734375, 1.4267578125, 1.886962890625, 2.34716796875, 2.807373046875, 3.267578125, 3.727783203125, 4.18798828125, 4.648193359375, 5.1083984375, 5.568603515625, 6.02880859375, 6.489013671875, 6.94921875, 7.409423828125, 7.86962890625, 8.329833984375, 8.7900390625, 9.250244140625, 9.71044921875, 10.170654296875, 10.630859375, 11.091064453125, 11.55126953125, 12.011474609375, 12.4716796875, 12.931884765625, 13.39208984375, 13.852294921875, 14.3125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 6.0, 7.0, 6.0, 8.0, 13.0, 10.0, 15.0, 14.0, 34.0, 32.0, 45.0, 64.0, 89.0, 97.0, 135.0, 241.0, 458.0, 1236.0, 567.0, 278.0, 191.0, 124.0, 95.0, 71.0, 50.0, 39.0, 39.0, 18.0, 18.0, 15.0, 9.0, 9.0, 10.0, 8.0, 7.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5693359375, -1.5146331787109375, -1.459930419921875, -1.4052276611328125, -1.35052490234375, -1.2958221435546875, -1.241119384765625, -1.1864166259765625, -1.1317138671875, -1.0770111083984375, -1.022308349609375, -0.9676055908203125, -0.91290283203125, -0.8582000732421875, -0.803497314453125, -0.7487945556640625, -0.694091796875, -0.6393890380859375, -0.584686279296875, -0.5299835205078125, -0.47528076171875, -0.4205780029296875, -0.365875244140625, -0.3111724853515625, -0.2564697265625, -0.2017669677734375, -0.147064208984375, -0.0923614501953125, -0.03765869140625, 0.0170440673828125, 0.071746826171875, 0.1264495849609375, 0.18115234375, 0.2358551025390625, 0.290557861328125, 0.3452606201171875, 0.39996337890625, 0.4546661376953125, 0.509368896484375, 0.5640716552734375, 0.6187744140625, 0.6734771728515625, 0.728179931640625, 0.7828826904296875, 0.83758544921875, 0.8922882080078125, 0.946990966796875, 1.0016937255859375, 1.056396484375, 1.1110992431640625, 1.165802001953125, 1.2205047607421875, 1.27520751953125, 1.3299102783203125, 1.384613037109375, 1.4393157958984375, 1.4940185546875, 1.5487213134765625, 1.603424072265625, 1.6581268310546875, 1.71282958984375, 1.7675323486328125, 1.822235107421875, 1.8769378662109375, 1.931640625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 10.0, 48.0, 103.0, 194.0, 243.0, 212.0, 106.0, 49.0, 22.0, 5.0, 4.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.544408798217773, -14.5470552444458, -13.549701690673828, -12.552349090576172, -11.5549955368042, -10.557641983032227, -9.56028938293457, -8.562935829162598, -7.565582275390625, -6.568228721618652, -5.570875644683838, -4.573522567749023, -3.576169013977051, -2.578815460205078, -1.5814623832702637, -0.5841093063354492, 0.41324424743652344, 1.410597562789917, 2.4079508781433105, 3.405304193496704, 4.402657508850098, 5.40001106262207, 6.397364139556885, 7.394717216491699, 8.392070770263672, 9.389424324035645, 10.386777877807617, 11.384130477905273, 12.381484031677246, 13.378837585449219, 14.376190185546875, 15.373543739318848, 16.370899200439453, 17.36825180053711, 18.3656063079834, 19.362958908081055, 20.360313415527344, 21.357666015625, 22.355018615722656, 23.352371215820312, 24.3497257232666, 25.347078323364258, 26.344432830810547, 27.341785430908203, 28.33913803100586, 29.33649253845215, 30.333845138549805, 31.331199645996094, 32.32855224609375, 33.325904846191406, 34.32325744628906, 35.320613861083984, 36.31796646118164, 37.3153190612793, 38.31267166137695, 39.31002426147461, 40.30738067626953, 41.30473327636719, 42.302085876464844, 43.299442291259766, 44.29679489135742, 45.29414749145508, 46.291500091552734, 47.28885269165039, 48.28620529174805]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 8.0, 8.0, 15.0, 12.0, 16.0, 14.0, 24.0, 30.0, 31.0, 33.0, 43.0, 33.0, 50.0, 48.0, 42.0, 57.0, 44.0, 42.0, 47.0, 50.0, 46.0, 41.0, 37.0, 41.0, 21.0, 19.0, 23.0, 30.0, 19.0, 19.0, 11.0, 13.0, 10.0, 9.0, 6.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.305354595184326, -7.049162864685059, -6.792971134185791, -6.536779403686523, -6.280587196350098, -6.02439546585083, -5.7682037353515625, -5.512012004852295, -5.255820274353027, -4.99962854385376, -4.743436813354492, -4.487244606018066, -4.231052875518799, -3.9748611450195312, -3.7186694145202637, -3.462477684020996, -3.2062854766845703, -2.9500937461853027, -2.693901777267456, -2.4377100467681885, -2.181518077850342, -1.9253263473510742, -1.6691346168518066, -1.4129427671432495, -1.1567509174346924, -0.9005590677261353, -0.6443672776222229, -0.38817548751831055, -0.13198363780975342, 0.12420821189880371, 0.3803999423980713, 0.6365917921066284, 0.8927831649780273, 1.1489750146865845, 1.4051668643951416, 1.6613585948944092, 1.9175504446029663, 2.1737422943115234, 2.429934024810791, 2.6861257553100586, 2.9423177242279053, 3.198509454727173, 3.4547014236450195, 3.710893154144287, 3.9670848846435547, 4.2232770919799805, 4.47946834564209, 4.735660552978516, 4.991852283477783, 5.248044013977051, 5.504235744476318, 5.760427474975586, 6.016619682312012, 6.272811412811279, 6.529003143310547, 6.7851948738098145, 7.041386604309082, 7.29757833480835, 7.553770065307617, 7.809962272644043, 8.066153526306152, 8.322345733642578, 8.578536987304688, 8.834729194641113, 9.090921401977539]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 17.0, 14.0, 23.0, 45.0, 65.0, 85.0, 190.0, 298.0, 423.0, 743.0, 1192.0, 2097.0, 3695.0, 6571.0, 12119.0, 23180.0, 43364.0, 81095.0, 144999.0, 221055.0, 212815.0, 134346.0, 74296.0, 39144.0, 21088.0, 11302.0, 6120.0, 3322.0, 1892.0, 1139.0, 722.0, 425.0, 241.0, 139.0, 85.0, 69.0, 40.0, 30.0, 27.0, 7.0, 20.0, 10.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1640625, -3.0546875, -2.9453125, -2.8359375, -2.7265625, -2.6171875, -2.5078125, -2.3984375, -2.2890625, -2.1796875, -2.0703125, -1.9609375, -1.8515625, -1.7421875, -1.6328125, -1.5234375, -1.4140625, -1.3046875, -1.1953125, -1.0859375, -0.9765625, -0.8671875, -0.7578125, -0.6484375, -0.5390625, -0.4296875, -0.3203125, -0.2109375, -0.1015625, 0.0078125, 0.1171875, 0.2265625, 0.3359375, 0.4453125, 0.5546875, 0.6640625, 0.7734375, 0.8828125, 0.9921875, 1.1015625, 1.2109375, 1.3203125, 1.4296875, 1.5390625, 1.6484375, 1.7578125, 1.8671875, 1.9765625, 2.0859375, 2.1953125, 2.3046875, 2.4140625, 2.5234375, 2.6328125, 2.7421875, 2.8515625, 2.9609375, 3.0703125, 3.1796875, 3.2890625, 3.3984375, 3.5078125, 3.6171875, 3.7265625, 3.8359375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 13.0, 4.0, 6.0, 12.0, 9.0, 15.0, 19.0, 23.0, 17.0, 17.0, 28.0, 23.0, 32.0, 31.0, 37.0, 37.0, 37.0, 46.0, 38.0, 48.0, 50.0, 39.0, 43.0, 46.0, 36.0, 40.0, 33.0, 41.0, 29.0, 21.0, 26.0, 26.0, 21.0, 10.0, 9.0, 10.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6796875, -0.6588134765625, -0.637939453125, -0.6170654296875, -0.59619140625, -0.5753173828125, -0.554443359375, -0.5335693359375, -0.5126953125, -0.4918212890625, -0.470947265625, -0.4500732421875, -0.42919921875, -0.4083251953125, -0.387451171875, -0.3665771484375, -0.345703125, -0.3248291015625, -0.303955078125, -0.2830810546875, -0.26220703125, -0.2413330078125, -0.220458984375, -0.1995849609375, -0.1787109375, -0.1578369140625, -0.136962890625, -0.1160888671875, -0.09521484375, -0.0743408203125, -0.053466796875, -0.0325927734375, -0.01171875, 0.0091552734375, 0.030029296875, 0.0509033203125, 0.07177734375, 0.0926513671875, 0.113525390625, 0.1343994140625, 0.1552734375, 0.1761474609375, 0.197021484375, 0.2178955078125, 0.23876953125, 0.2596435546875, 0.280517578125, 0.3013916015625, 0.322265625, 0.3431396484375, 0.364013671875, 0.3848876953125, 0.40576171875, 0.4266357421875, 0.447509765625, 0.4683837890625, 0.4892578125, 0.5101318359375, 0.531005859375, 0.5518798828125, 0.57275390625, 0.5936279296875, 0.614501953125, 0.6353759765625, 0.65625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 4.0, 7.0, 5.0, 8.0, 14.0, 20.0, 27.0, 35.0, 44.0, 59.0, 67.0, 113.0, 116.0, 165.0, 290.0, 410.0, 692.0, 1312.0, 3302.0, 11184.0, 47428.0, 211681.0, 499957.0, 208033.0, 45962.0, 10883.0, 3277.0, 1374.0, 704.0, 409.0, 286.0, 192.0, 133.0, 85.0, 71.0, 53.0, 34.0, 36.0, 25.0, 9.0, 15.0, 9.0, 7.0, 7.0, 4.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.91796875, -7.68841552734375, -7.4588623046875, -7.22930908203125, -6.999755859375, -6.77020263671875, -6.5406494140625, -6.31109619140625, -6.08154296875, -5.85198974609375, -5.6224365234375, -5.39288330078125, -5.163330078125, -4.93377685546875, -4.7042236328125, -4.47467041015625, -4.2451171875, -4.01556396484375, -3.7860107421875, -3.55645751953125, -3.326904296875, -3.09735107421875, -2.8677978515625, -2.63824462890625, -2.40869140625, -2.17913818359375, -1.9495849609375, -1.72003173828125, -1.490478515625, -1.26092529296875, -1.0313720703125, -0.80181884765625, -0.572265625, -0.34271240234375, -0.1131591796875, 0.11639404296875, 0.345947265625, 0.57550048828125, 0.8050537109375, 1.03460693359375, 1.26416015625, 1.49371337890625, 1.7232666015625, 1.95281982421875, 2.182373046875, 2.41192626953125, 2.6414794921875, 2.87103271484375, 3.1005859375, 3.33013916015625, 3.5596923828125, 3.78924560546875, 4.018798828125, 4.24835205078125, 4.4779052734375, 4.70745849609375, 4.93701171875, 5.16656494140625, 5.3961181640625, 5.62567138671875, 5.855224609375, 6.08477783203125, 6.3143310546875, 6.54388427734375, 6.7734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 6.0, 4.0, 15.0, 15.0, 10.0, 16.0, 18.0, 17.0, 22.0, 27.0, 32.0, 28.0, 38.0, 24.0, 21.0, 48.0, 34.0, 37.0, 57.0, 33.0, 38.0, 49.0, 31.0, 35.0, 32.0, 30.0, 32.0, 32.0, 35.0, 28.0, 21.0, 23.0, 14.0, 16.0, 15.0, 10.0, 10.0, 12.0, 8.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3671875, -3.261474609375, -3.15576171875, -3.050048828125, -2.9443359375, -2.838623046875, -2.73291015625, -2.627197265625, -2.521484375, -2.415771484375, -2.31005859375, -2.204345703125, -2.0986328125, -1.992919921875, -1.88720703125, -1.781494140625, -1.67578125, -1.570068359375, -1.46435546875, -1.358642578125, -1.2529296875, -1.147216796875, -1.04150390625, -0.935791015625, -0.830078125, -0.724365234375, -0.61865234375, -0.512939453125, -0.4072265625, -0.301513671875, -0.19580078125, -0.090087890625, 0.015625, 0.121337890625, 0.22705078125, 0.332763671875, 0.4384765625, 0.544189453125, 0.64990234375, 0.755615234375, 0.861328125, 0.967041015625, 1.07275390625, 1.178466796875, 1.2841796875, 1.389892578125, 1.49560546875, 1.601318359375, 1.70703125, 1.812744140625, 1.91845703125, 2.024169921875, 2.1298828125, 2.235595703125, 2.34130859375, 2.447021484375, 2.552734375, 2.658447265625, 2.76416015625, 2.869873046875, 2.9755859375, 3.081298828125, 3.18701171875, 3.292724609375, 3.3984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 8.0, 6.0, 6.0, 11.0, 24.0, 34.0, 43.0, 75.0, 114.0, 217.0, 343.0, 684.0, 1418.0, 3207.0, 8920.0, 38089.0, 339529.0, 568204.0, 66759.0, 12880.0, 4200.0, 1829.0, 915.0, 444.0, 257.0, 147.0, 69.0, 36.0, 31.0, 18.0, 9.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -4.99566650390625, -4.8116455078125, -4.62762451171875, -4.443603515625, -4.25958251953125, -4.0755615234375, -3.89154052734375, -3.70751953125, -3.52349853515625, -3.3394775390625, -3.15545654296875, -2.971435546875, -2.78741455078125, -2.6033935546875, -2.41937255859375, -2.2353515625, -2.05133056640625, -1.8673095703125, -1.68328857421875, -1.499267578125, -1.31524658203125, -1.1312255859375, -0.94720458984375, -0.76318359375, -0.57916259765625, -0.3951416015625, -0.21112060546875, -0.027099609375, 0.15692138671875, 0.3409423828125, 0.52496337890625, 0.708984375, 0.89300537109375, 1.0770263671875, 1.26104736328125, 1.445068359375, 1.62908935546875, 1.8131103515625, 1.99713134765625, 2.18115234375, 2.36517333984375, 2.5491943359375, 2.73321533203125, 2.917236328125, 3.10125732421875, 3.2852783203125, 3.46929931640625, 3.6533203125, 3.83734130859375, 4.0213623046875, 4.20538330078125, 4.389404296875, 4.57342529296875, 4.7574462890625, 4.94146728515625, 5.12548828125, 5.30950927734375, 5.4935302734375, 5.67755126953125, 5.861572265625, 6.04559326171875, 6.2296142578125, 6.41363525390625, 6.59765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 11.0, 10.0, 23.0, 44.0, 61.0, 79.0, 150.0, 185.0, 158.0, 95.0, 63.0, 37.0, 29.0, 21.0, 7.0, 10.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009832382202148438, -0.0009556189179420471, -0.0009279996156692505, -0.0009003803133964539, -0.0008727610111236572, -0.0008451417088508606, -0.000817522406578064, -0.0007899031043052673, -0.0007622838020324707, -0.0007346644997596741, -0.0007070451974868774, -0.0006794258952140808, -0.0006518065929412842, -0.0006241872906684875, -0.0005965679883956909, -0.0005689486861228943, -0.0005413293838500977, -0.000513710081577301, -0.0004860907793045044, -0.00045847147703170776, -0.00043085217475891113, -0.0004032328724861145, -0.00037561357021331787, -0.00034799426794052124, -0.0003203749656677246, -0.000292755663394928, -0.00026513636112213135, -0.00023751705884933472, -0.00020989775657653809, -0.00018227845430374146, -0.00015465915203094482, -0.0001270398497581482, -9.942054748535156e-05, -7.180124521255493e-05, -4.41819429397583e-05, -1.656264066696167e-05, 1.1056661605834961e-05, 3.867596387863159e-05, 6.629526615142822e-05, 9.391456842422485e-05, 0.00012153387069702148, 0.00014915317296981812, 0.00017677247524261475, 0.00020439177751541138, 0.000232011079788208, 0.00025963038206100464, 0.00028724968433380127, 0.0003148689866065979, 0.00034248828887939453, 0.00037010759115219116, 0.0003977268934249878, 0.0004253461956977844, 0.00045296549797058105, 0.0004805848002433777, 0.0005082041025161743, 0.000535823404788971, 0.0005634427070617676, 0.0005910620093345642, 0.0006186813116073608, 0.0006463006138801575, 0.0006739199161529541, 0.0007015392184257507, 0.0007291585206985474, 0.000756777822971344, 0.0007843971252441406]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 15.0, 12.0, 16.0, 36.0, 70.0, 102.0, 240.0, 688.0, 2873.0, 20824.0, 713154.0, 296685.0, 10997.0, 1928.0, 495.0, 196.0, 81.0, 53.0, 31.0, 18.0, 15.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.4453125, -9.09375, -8.7421875, -8.390625, -8.0390625, -7.6875, -7.3359375, -6.984375, -6.6328125, -6.28125, -5.9296875, -5.578125, -5.2265625, -4.875, -4.5234375, -4.171875, -3.8203125, -3.46875, -3.1171875, -2.765625, -2.4140625, -2.0625, -1.7109375, -1.359375, -1.0078125, -0.65625, -0.3046875, 0.046875, 0.3984375, 0.75, 1.1015625, 1.453125, 1.8046875, 2.15625, 2.5078125, 2.859375, 3.2109375, 3.5625, 3.9140625, 4.265625, 4.6171875, 4.96875, 5.3203125, 5.671875, 6.0234375, 6.375, 6.7265625, 7.078125, 7.4296875, 7.78125, 8.1328125, 8.484375, 8.8359375, 9.1875, 9.5390625, 9.890625, 10.2421875, 10.59375, 10.9453125, 11.296875, 11.6484375, 12.0, 12.3515625, 12.703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 3.0, 6.0, 10.0, 9.0, 19.0, 29.0, 32.0, 48.0, 74.0, 108.0, 116.0, 121.0, 110.0, 76.0, 56.0, 44.0, 27.0, 34.0, 19.0, 11.0, 8.0, 6.0, 9.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5390625, -2.438690185546875, -2.33831787109375, -2.237945556640625, -2.1375732421875, -2.037200927734375, -1.93682861328125, -1.836456298828125, -1.736083984375, -1.635711669921875, -1.53533935546875, -1.434967041015625, -1.3345947265625, -1.234222412109375, -1.13385009765625, -1.033477783203125, -0.93310546875, -0.832733154296875, -0.73236083984375, -0.631988525390625, -0.5316162109375, -0.431243896484375, -0.33087158203125, -0.230499267578125, -0.130126953125, -0.029754638671875, 0.07061767578125, 0.170989990234375, 0.2713623046875, 0.371734619140625, 0.47210693359375, 0.572479248046875, 0.6728515625, 0.773223876953125, 0.87359619140625, 0.973968505859375, 1.0743408203125, 1.174713134765625, 1.27508544921875, 1.375457763671875, 1.475830078125, 1.576202392578125, 1.67657470703125, 1.776947021484375, 1.8773193359375, 1.977691650390625, 2.07806396484375, 2.178436279296875, 2.27880859375, 2.379180908203125, 2.47955322265625, 2.579925537109375, 2.6802978515625, 2.780670166015625, 2.88104248046875, 2.981414794921875, 3.081787109375, 3.182159423828125, 3.28253173828125, 3.382904052734375, 3.4832763671875, 3.583648681640625, 3.68402099609375, 3.784393310546875, 3.884765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 17.0, 22.0, 31.0, 70.0, 97.0, 123.0, 161.0, 140.0, 125.0, 74.0, 50.0, 21.0, 27.0, 8.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.855499267578125, -31.468908309936523, -30.082319259643555, -28.695728302001953, -27.309139251708984, -25.922548294067383, -24.53595733642578, -23.149368286132812, -21.76277732849121, -20.37618637084961, -18.98959732055664, -17.60300636291504, -16.216415405273438, -14.829826354980469, -13.443235397338867, -12.056645393371582, -10.670055389404297, -9.283465385437012, -7.896874904632568, -6.510284423828125, -5.12369441986084, -3.7371044158935547, -2.350513458251953, -0.963923454284668, 0.4226665496826172, 1.8092567920684814, 3.1958470344543457, 4.582437515258789, 5.969027519226074, 7.355617523193359, 8.742208480834961, 10.128798484802246, 11.515388488769531, 12.901978492736816, 14.288568496704102, 15.675159454345703, 17.061748504638672, 18.448339462280273, 19.834930419921875, 21.221519470214844, 22.608110427856445, 23.994701385498047, 25.381290435791016, 26.767881393432617, 28.15447235107422, 29.541061401367188, 30.92765235900879, 32.31424331665039, 33.70083236694336, 35.08742141723633, 36.47401428222656, 37.86060333251953, 39.2471923828125, 40.63378143310547, 42.0203742980957, 43.40696334838867, 44.793556213378906, 46.180145263671875, 47.56673812866211, 48.95332717895508, 50.33991622924805, 51.72650909423828, 53.11309814453125, 54.49968719482422, 55.88627624511719]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 7.0, 11.0, 13.0, 10.0, 11.0, 12.0, 22.0, 20.0, 18.0, 21.0, 28.0, 30.0, 35.0, 47.0, 44.0, 38.0, 49.0, 39.0, 42.0, 32.0, 41.0, 51.0, 35.0, 48.0, 32.0, 29.0, 27.0, 22.0, 31.0, 20.0, 23.0, 19.0, 14.0, 11.0, 13.0, 10.0, 6.0, 6.0, 5.0, 2.0, 11.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-23.02880096435547, -22.35460662841797, -21.6804141998291, -21.0062198638916, -20.332027435302734, -19.657833099365234, -18.983638763427734, -18.309446334838867, -17.635251998901367, -16.961057662963867, -16.286865234375, -15.6126708984375, -14.938477516174316, -14.264284133911133, -13.59009075164795, -12.915897369384766, -12.241703987121582, -11.567510604858398, -10.893317222595215, -10.219123840332031, -9.544929504394531, -8.870736122131348, -8.196542739868164, -7.522348880767822, -6.848155498504639, -6.173962116241455, -5.499768257141113, -4.82557487487793, -4.151381492614746, -3.4771876335144043, -2.8029942512512207, -2.128800392150879, -1.4546070098876953, -0.7804134488105774, -0.10621988773345947, 0.5679736137390137, 1.2421672344207764, 1.916360855102539, 2.5905542373657227, 3.2647480964660645, 3.938941478729248, 4.613134860992432, 5.287328720092773, 5.961522102355957, 6.635715484619141, 7.309909343719482, 7.984102725982666, 8.658296585083008, 9.332489967346191, 10.006683349609375, 10.680876731872559, 11.355070114135742, 12.029264450073242, 12.703457832336426, 13.37765121459961, 14.05184555053711, 14.726037979125977, 15.40023136138916, 16.074424743652344, 16.748619079589844, 17.42281150817871, 18.09700584411621, 18.771198272705078, 19.445392608642578, 20.119586944580078]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 11.0, 14.0, 33.0, 39.0, 57.0, 78.0, 138.0, 174.0, 287.0, 501.0, 951.0, 1664.0, 3143.0, 6645.0, 15279.0, 41244.0, 153486.0, 3237716.0, 596100.0, 86653.0, 28208.0, 11372.0, 5077.0, 2440.0, 1253.0, 624.0, 403.0, 242.0, 163.0, 87.0, 65.0, 40.0, 27.0, 16.0, 12.0, 8.0, 10.0, 4.0, 0.0, 3.0], "bins": [-8.109375, -7.9154052734375, -7.721435546875, -7.5274658203125, -7.33349609375, -7.1395263671875, -6.945556640625, -6.7515869140625, -6.5576171875, -6.3636474609375, -6.169677734375, -5.9757080078125, -5.78173828125, -5.5877685546875, -5.393798828125, -5.1998291015625, -5.005859375, -4.8118896484375, -4.617919921875, -4.4239501953125, -4.22998046875, -4.0360107421875, -3.842041015625, -3.6480712890625, -3.4541015625, -3.2601318359375, -3.066162109375, -2.8721923828125, -2.67822265625, -2.4842529296875, -2.290283203125, -2.0963134765625, -1.90234375, -1.7083740234375, -1.514404296875, -1.3204345703125, -1.12646484375, -0.9324951171875, -0.738525390625, -0.5445556640625, -0.3505859375, -0.1566162109375, 0.037353515625, 0.2313232421875, 0.42529296875, 0.6192626953125, 0.813232421875, 1.0072021484375, 1.201171875, 1.3951416015625, 1.589111328125, 1.7830810546875, 1.97705078125, 2.1710205078125, 2.364990234375, 2.5589599609375, 2.7529296875, 2.9468994140625, 3.140869140625, 3.3348388671875, 3.52880859375, 3.7227783203125, 3.916748046875, 4.1107177734375, 4.3046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 7.0, 4.0, 18.0, 14.0, 15.0, 29.0, 32.0, 24.0, 34.0, 37.0, 50.0, 62.0, 63.0, 69.0, 61.0, 69.0, 57.0, 60.0, 63.0, 40.0, 38.0, 31.0, 27.0, 20.0, 22.0, 20.0, 8.0, 8.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.01953125, -0.9907302856445312, -0.9619293212890625, -0.9331283569335938, -0.904327392578125, -0.8755264282226562, -0.8467254638671875, -0.8179244995117188, -0.78912353515625, -0.7603225708007812, -0.7315216064453125, -0.7027206420898438, -0.673919677734375, -0.6451187133789062, -0.6163177490234375, -0.5875167846679688, -0.5587158203125, -0.5299148559570312, -0.5011138916015625, -0.47231292724609375, -0.443511962890625, -0.41471099853515625, -0.3859100341796875, -0.35710906982421875, -0.32830810546875, -0.29950714111328125, -0.2707061767578125, -0.24190521240234375, -0.213104248046875, -0.18430328369140625, -0.1555023193359375, -0.12670135498046875, -0.097900390625, -0.06909942626953125, -0.0402984619140625, -0.01149749755859375, 0.017303466796875, 0.04610443115234375, 0.0749053955078125, 0.10370635986328125, 0.13250732421875, 0.16130828857421875, 0.1901092529296875, 0.21891021728515625, 0.247711181640625, 0.27651214599609375, 0.3053131103515625, 0.33411407470703125, 0.3629150390625, 0.39171600341796875, 0.4205169677734375, 0.44931793212890625, 0.478118896484375, 0.5069198608398438, 0.5357208251953125, 0.5645217895507812, 0.59332275390625, 0.6221237182617188, 0.6509246826171875, 0.6797256469726562, 0.708526611328125, 0.7373275756835938, 0.7661285400390625, 0.7949295043945312, 0.82373046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 5.0, 2.0, 10.0, 17.0, 19.0, 24.0, 22.0, 59.0, 80.0, 185.0, 324.0, 625.0, 1475.0, 3552.0, 8773.0, 25107.0, 83844.0, 431145.0, 3218446.0, 319852.0, 68435.0, 20301.0, 7123.0, 2725.0, 1107.0, 491.0, 250.0, 108.0, 67.0, 38.0, 27.0, 15.0, 14.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.60546875, -6.38836669921875, -6.1712646484375, -5.95416259765625, -5.737060546875, -5.51995849609375, -5.3028564453125, -5.08575439453125, -4.86865234375, -4.65155029296875, -4.4344482421875, -4.21734619140625, -4.000244140625, -3.78314208984375, -3.5660400390625, -3.34893798828125, -3.1318359375, -2.91473388671875, -2.6976318359375, -2.48052978515625, -2.263427734375, -2.04632568359375, -1.8292236328125, -1.61212158203125, -1.39501953125, -1.17791748046875, -0.9608154296875, -0.74371337890625, -0.526611328125, -0.30950927734375, -0.0924072265625, 0.12469482421875, 0.341796875, 0.55889892578125, 0.7760009765625, 0.99310302734375, 1.210205078125, 1.42730712890625, 1.6444091796875, 1.86151123046875, 2.07861328125, 2.29571533203125, 2.5128173828125, 2.72991943359375, 2.947021484375, 3.16412353515625, 3.3812255859375, 3.59832763671875, 3.8154296875, 4.03253173828125, 4.2496337890625, 4.46673583984375, 4.683837890625, 4.90093994140625, 5.1180419921875, 5.33514404296875, 5.55224609375, 5.76934814453125, 5.9864501953125, 6.20355224609375, 6.420654296875, 6.63775634765625, 6.8548583984375, 7.07196044921875, 7.2890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 4.0, 3.0, 6.0, 15.0, 14.0, 23.0, 24.0, 21.0, 43.0, 35.0, 55.0, 52.0, 92.0, 103.0, 174.0, 285.0, 559.0, 1242.0, 439.0, 224.0, 167.0, 105.0, 95.0, 65.0, 55.0, 37.0, 27.0, 15.0, 13.0, 14.0, 12.0, 14.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4091796875, -1.3656158447265625, -1.322052001953125, -1.2784881591796875, -1.23492431640625, -1.1913604736328125, -1.147796630859375, -1.1042327880859375, -1.0606689453125, -1.0171051025390625, -0.973541259765625, -0.9299774169921875, -0.88641357421875, -0.8428497314453125, -0.799285888671875, -0.7557220458984375, -0.712158203125, -0.6685943603515625, -0.625030517578125, -0.5814666748046875, -0.53790283203125, -0.4943389892578125, -0.450775146484375, -0.4072113037109375, -0.3636474609375, -0.3200836181640625, -0.276519775390625, -0.2329559326171875, -0.18939208984375, -0.1458282470703125, -0.102264404296875, -0.0587005615234375, -0.01513671875, 0.0284271240234375, 0.071990966796875, 0.1155548095703125, 0.15911865234375, 0.2026824951171875, 0.246246337890625, 0.2898101806640625, 0.3333740234375, 0.3769378662109375, 0.420501708984375, 0.4640655517578125, 0.50762939453125, 0.5511932373046875, 0.594757080078125, 0.6383209228515625, 0.681884765625, 0.7254486083984375, 0.769012451171875, 0.8125762939453125, 0.85614013671875, 0.8997039794921875, 0.943267822265625, 0.9868316650390625, 1.0303955078125, 1.0739593505859375, 1.117523193359375, 1.1610870361328125, 1.20465087890625, 1.2482147216796875, 1.291778564453125, 1.3353424072265625, 1.37890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 7.0, 15.0, 69.0, 215.0, 363.0, 239.0, 71.0, 17.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.0728759765625, -61.87200164794922, -60.67112731933594, -59.47025680541992, -58.26938247680664, -57.06850814819336, -55.86763381958008, -54.6667594909668, -53.46588897705078, -52.2650146484375, -51.06414031982422, -49.8632698059082, -48.66239547729492, -47.46152114868164, -46.26064682006836, -45.05977249145508, -43.8588981628418, -42.658023834228516, -41.457149505615234, -40.25627899169922, -39.05540466308594, -37.854530334472656, -36.653656005859375, -35.452781677246094, -34.25190734863281, -33.05103302001953, -31.850160598754883, -30.6492862701416, -29.448413848876953, -28.247539520263672, -27.04666519165039, -25.84579086303711, -24.644916534423828, -23.444042205810547, -22.2431697845459, -21.042295455932617, -19.84142303466797, -18.640548706054688, -17.439674377441406, -16.238800048828125, -15.037927627563477, -13.837054252624512, -12.636180877685547, -11.435306549072266, -10.2344331741333, -9.033559799194336, -7.832685947418213, -6.63181209564209, -5.430938720703125, -4.23006534576416, -3.029191493988037, -1.8283178806304932, -0.6274442672729492, 0.5734291076660156, 1.7743029594421387, 2.9751768112182617, 4.176050186157227, 5.376923561096191, 6.5777974128723145, 7.7786712646484375, 8.979544639587402, 10.180418014526367, 11.381292343139648, 12.582165718078613, 13.783039093017578]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 10.0, 18.0, 17.0, 18.0, 17.0, 20.0, 28.0, 35.0, 42.0, 37.0, 48.0, 48.0, 45.0, 54.0, 46.0, 57.0, 47.0, 56.0, 60.0, 39.0, 39.0, 28.0, 28.0, 24.0, 15.0, 18.0, 22.0, 13.0, 13.0, 9.0, 9.0, 9.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.536355972290039, -5.313342094421387, -5.090328693389893, -4.86731481552124, -4.644301414489746, -4.421287536621094, -4.1982741355896, -3.9752602577209473, -3.752246856689453, -3.52923321723938, -3.3062195777893066, -3.0832059383392334, -2.86019229888916, -2.637178421020508, -2.4141650199890137, -2.1911511421203613, -1.968137502670288, -1.7451238632202148, -1.5221102237701416, -1.2990965843200684, -1.0760829448699951, -0.8530691862106323, -0.6300555467605591, -0.40704190731048584, -0.1840282678604126, 0.03898538649082184, 0.2619990408420563, 0.4850127100944519, 0.7080263495445251, 0.9310400485992432, 1.1540536880493164, 1.3770673274993896, 1.600080966949463, 1.8230946063995361, 2.0461082458496094, 2.2691218852996826, 2.492135524749756, 2.715149402618408, 2.9381628036499023, 3.1611766815185547, 3.384190082550049, 3.607203722000122, 3.8302173614501953, 4.053231239318848, 4.276244640350342, 4.499258518218994, 4.722271919250488, 4.945285797119141, 5.168299674987793, 5.391313552856445, 5.6143269538879395, 5.837340831756592, 6.060354232788086, 6.283368110656738, 6.506381511688232, 6.729395389556885, 6.952408790588379, 7.175422668457031, 7.398436069488525, 7.621449947357178, 7.844463348388672, 8.067477226257324, 8.290491104125977, 8.513504028320312, 8.736517906188965]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 8.0, 1.0, 8.0, 6.0, 11.0, 15.0, 10.0, 19.0, 19.0, 37.0, 42.0, 57.0, 81.0, 137.0, 171.0, 259.0, 356.0, 510.0, 783.0, 1186.0, 1915.0, 3201.0, 5588.0, 11076.0, 22741.0, 49097.0, 106615.0, 212611.0, 277742.0, 183645.0, 88725.0, 40343.0, 19248.0, 9479.0, 5011.0, 2780.0, 1705.0, 1006.0, 695.0, 499.0, 287.0, 255.0, 176.0, 104.0, 79.0, 65.0, 52.0, 22.0, 27.0, 13.0, 14.0, 10.0, 8.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0], "bins": [-3.875, -3.7589111328125, -3.642822265625, -3.5267333984375, -3.41064453125, -3.2945556640625, -3.178466796875, -3.0623779296875, -2.9462890625, -2.8302001953125, -2.714111328125, -2.5980224609375, -2.48193359375, -2.3658447265625, -2.249755859375, -2.1336669921875, -2.017578125, -1.9014892578125, -1.785400390625, -1.6693115234375, -1.55322265625, -1.4371337890625, -1.321044921875, -1.2049560546875, -1.0888671875, -0.9727783203125, -0.856689453125, -0.7406005859375, -0.62451171875, -0.5084228515625, -0.392333984375, -0.2762451171875, -0.16015625, -0.0440673828125, 0.072021484375, 0.1881103515625, 0.30419921875, 0.4202880859375, 0.536376953125, 0.6524658203125, 0.7685546875, 0.8846435546875, 1.000732421875, 1.1168212890625, 1.23291015625, 1.3489990234375, 1.465087890625, 1.5811767578125, 1.697265625, 1.8133544921875, 1.929443359375, 2.0455322265625, 2.16162109375, 2.2777099609375, 2.393798828125, 2.5098876953125, 2.6259765625, 2.7420654296875, 2.858154296875, 2.9742431640625, 3.09033203125, 3.2064208984375, 3.322509765625, 3.4385986328125, 3.5546875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 12.0, 8.0, 10.0, 19.0, 9.0, 14.0, 17.0, 25.0, 26.0, 26.0, 34.0, 36.0, 33.0, 42.0, 48.0, 45.0, 55.0, 76.0, 60.0, 51.0, 40.0, 34.0, 42.0, 31.0, 27.0, 40.0, 30.0, 22.0, 20.0, 20.0, 19.0, 6.0, 8.0, 3.0, 1.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.685546875, -0.661224365234375, -0.63690185546875, -0.612579345703125, -0.5882568359375, -0.563934326171875, -0.53961181640625, -0.515289306640625, -0.490966796875, -0.466644287109375, -0.44232177734375, -0.417999267578125, -0.3936767578125, -0.369354248046875, -0.34503173828125, -0.320709228515625, -0.29638671875, -0.272064208984375, -0.24774169921875, -0.223419189453125, -0.1990966796875, -0.174774169921875, -0.15045166015625, -0.126129150390625, -0.101806640625, -0.077484130859375, -0.05316162109375, -0.028839111328125, -0.0045166015625, 0.019805908203125, 0.04412841796875, 0.068450927734375, 0.0927734375, 0.117095947265625, 0.14141845703125, 0.165740966796875, 0.1900634765625, 0.214385986328125, 0.23870849609375, 0.263031005859375, 0.287353515625, 0.311676025390625, 0.33599853515625, 0.360321044921875, 0.3846435546875, 0.408966064453125, 0.43328857421875, 0.457611083984375, 0.48193359375, 0.506256103515625, 0.53057861328125, 0.554901123046875, 0.5792236328125, 0.603546142578125, 0.62786865234375, 0.652191162109375, 0.676513671875, 0.700836181640625, 0.72515869140625, 0.749481201171875, 0.7738037109375, 0.798126220703125, 0.82244873046875, 0.846771240234375, 0.87109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 9.0, 17.0, 10.0, 21.0, 16.0, 27.0, 44.0, 50.0, 58.0, 93.0, 147.0, 196.0, 245.0, 349.0, 483.0, 754.0, 1419.0, 3173.0, 8422.0, 27874.0, 102809.0, 327727.0, 382724.0, 136441.0, 36481.0, 10717.0, 3778.0, 1639.0, 940.0, 514.0, 365.0, 240.0, 204.0, 151.0, 109.0, 73.0, 61.0, 47.0, 32.0, 27.0, 24.0, 16.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.24609375, -5.08270263671875, -4.9193115234375, -4.75592041015625, -4.592529296875, -4.42913818359375, -4.2657470703125, -4.10235595703125, -3.93896484375, -3.77557373046875, -3.6121826171875, -3.44879150390625, -3.285400390625, -3.12200927734375, -2.9586181640625, -2.79522705078125, -2.6318359375, -2.46844482421875, -2.3050537109375, -2.14166259765625, -1.978271484375, -1.81488037109375, -1.6514892578125, -1.48809814453125, -1.32470703125, -1.16131591796875, -0.9979248046875, -0.83453369140625, -0.671142578125, -0.50775146484375, -0.3443603515625, -0.18096923828125, -0.017578125, 0.14581298828125, 0.3092041015625, 0.47259521484375, 0.635986328125, 0.79937744140625, 0.9627685546875, 1.12615966796875, 1.28955078125, 1.45294189453125, 1.6163330078125, 1.77972412109375, 1.943115234375, 2.10650634765625, 2.2698974609375, 2.43328857421875, 2.5966796875, 2.76007080078125, 2.9234619140625, 3.08685302734375, 3.250244140625, 3.41363525390625, 3.5770263671875, 3.74041748046875, 3.90380859375, 4.06719970703125, 4.2305908203125, 4.39398193359375, 4.557373046875, 4.72076416015625, 4.8841552734375, 5.04754638671875, 5.2109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 2.0, 5.0, 12.0, 7.0, 12.0, 14.0, 13.0, 13.0, 19.0, 19.0, 35.0, 26.0, 27.0, 35.0, 25.0, 38.0, 44.0, 57.0, 38.0, 41.0, 51.0, 31.0, 38.0, 46.0, 38.0, 38.0, 39.0, 34.0, 35.0, 30.0, 21.0, 36.0, 15.0, 12.0, 19.0, 6.0, 7.0, 4.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.498046875, -3.394775390625, -3.29150390625, -3.188232421875, -3.0849609375, -2.981689453125, -2.87841796875, -2.775146484375, -2.671875, -2.568603515625, -2.46533203125, -2.362060546875, -2.2587890625, -2.155517578125, -2.05224609375, -1.948974609375, -1.845703125, -1.742431640625, -1.63916015625, -1.535888671875, -1.4326171875, -1.329345703125, -1.22607421875, -1.122802734375, -1.01953125, -0.916259765625, -0.81298828125, -0.709716796875, -0.6064453125, -0.503173828125, -0.39990234375, -0.296630859375, -0.193359375, -0.090087890625, 0.01318359375, 0.116455078125, 0.2197265625, 0.322998046875, 0.42626953125, 0.529541015625, 0.6328125, 0.736083984375, 0.83935546875, 0.942626953125, 1.0458984375, 1.149169921875, 1.25244140625, 1.355712890625, 1.458984375, 1.562255859375, 1.66552734375, 1.768798828125, 1.8720703125, 1.975341796875, 2.07861328125, 2.181884765625, 2.28515625, 2.388427734375, 2.49169921875, 2.594970703125, 2.6982421875, 2.801513671875, 2.90478515625, 3.008056640625, 3.111328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 9.0, 14.0, 24.0, 44.0, 57.0, 119.0, 188.0, 358.0, 782.0, 1981.0, 5878.0, 24234.0, 145849.0, 587807.0, 231853.0, 36666.0, 8161.0, 2513.0, 1024.0, 436.0, 232.0, 118.0, 65.0, 46.0, 15.0, 22.0, 8.0, 14.0, 6.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.759765625, -3.640869140625, -3.52197265625, -3.403076171875, -3.2841796875, -3.165283203125, -3.04638671875, -2.927490234375, -2.80859375, -2.689697265625, -2.57080078125, -2.451904296875, -2.3330078125, -2.214111328125, -2.09521484375, -1.976318359375, -1.857421875, -1.738525390625, -1.61962890625, -1.500732421875, -1.3818359375, -1.262939453125, -1.14404296875, -1.025146484375, -0.90625, -0.787353515625, -0.66845703125, -0.549560546875, -0.4306640625, -0.311767578125, -0.19287109375, -0.073974609375, 0.044921875, 0.163818359375, 0.28271484375, 0.401611328125, 0.5205078125, 0.639404296875, 0.75830078125, 0.877197265625, 0.99609375, 1.114990234375, 1.23388671875, 1.352783203125, 1.4716796875, 1.590576171875, 1.70947265625, 1.828369140625, 1.947265625, 2.066162109375, 2.18505859375, 2.303955078125, 2.4228515625, 2.541748046875, 2.66064453125, 2.779541015625, 2.8984375, 3.017333984375, 3.13623046875, 3.255126953125, 3.3740234375, 3.492919921875, 3.61181640625, 3.730712890625, 3.849609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 3.0, 10.0, 3.0, 6.0, 7.0, 13.0, 11.0, 20.0, 22.0, 34.0, 26.0, 39.0, 42.0, 58.0, 85.0, 80.0, 87.0, 89.0, 70.0, 62.0, 39.0, 36.0, 26.0, 22.0, 18.0, 10.0, 9.0, 9.0, 12.0, 7.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003113746643066406, -0.00030067190527915955, -0.00028996914625167847, -0.0002792663872241974, -0.0002685636281967163, -0.00025786086916923523, -0.00024715811014175415, -0.00023645535111427307, -0.000225752592086792, -0.0002150498330593109, -0.00020434707403182983, -0.00019364431500434875, -0.00018294155597686768, -0.0001722387969493866, -0.00016153603792190552, -0.00015083327889442444, -0.00014013051986694336, -0.00012942776083946228, -0.0001187250018119812, -0.00010802224278450012, -9.731948375701904e-05, -8.661672472953796e-05, -7.591396570205688e-05, -6.52112066745758e-05, -5.4508447647094727e-05, -4.380568861961365e-05, -3.310292959213257e-05, -2.240017056465149e-05, -1.169741153717041e-05, -9.94652509689331e-07, 9.708106517791748e-06, 2.0410865545272827e-05, 3.1113624572753906e-05, 4.1816383600234985e-05, 5.2519142627716064e-05, 6.322190165519714e-05, 7.392466068267822e-05, 8.46274197101593e-05, 9.533017873764038e-05, 0.00010603293776512146, 0.00011673569679260254, 0.00012743845582008362, 0.0001381412148475647, 0.00014884397387504578, 0.00015954673290252686, 0.00017024949193000793, 0.00018095225095748901, 0.0001916550099849701, 0.00020235776901245117, 0.00021306052803993225, 0.00022376328706741333, 0.0002344660460948944, 0.0002451688051223755, 0.00025587156414985657, 0.00026657432317733765, 0.0002772770822048187, 0.0002879798412322998, 0.0002986826002597809, 0.00030938535928726196, 0.00032008811831474304, 0.0003307908773422241, 0.0003414936363697052, 0.0003521963953971863, 0.00036289915442466736, 0.00037360191345214844]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 5.0, 6.0, 12.0, 10.0, 22.0, 36.0, 42.0, 66.0, 120.0, 205.0, 388.0, 605.0, 1296.0, 3058.0, 9377.0, 42068.0, 273489.0, 571352.0, 116205.0, 20554.0, 5396.0, 2045.0, 960.0, 485.0, 290.0, 182.0, 85.0, 69.0, 29.0, 22.0, 22.0, 15.0, 12.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.47100830078125, -3.3482666015625, -3.22552490234375, -3.102783203125, -2.98004150390625, -2.8572998046875, -2.73455810546875, -2.61181640625, -2.48907470703125, -2.3663330078125, -2.24359130859375, -2.120849609375, -1.99810791015625, -1.8753662109375, -1.75262451171875, -1.6298828125, -1.50714111328125, -1.3843994140625, -1.26165771484375, -1.138916015625, -1.01617431640625, -0.8934326171875, -0.77069091796875, -0.64794921875, -0.52520751953125, -0.4024658203125, -0.27972412109375, -0.156982421875, -0.03424072265625, 0.0885009765625, 0.21124267578125, 0.333984375, 0.45672607421875, 0.5794677734375, 0.70220947265625, 0.824951171875, 0.94769287109375, 1.0704345703125, 1.19317626953125, 1.31591796875, 1.43865966796875, 1.5614013671875, 1.68414306640625, 1.806884765625, 1.92962646484375, 2.0523681640625, 2.17510986328125, 2.2978515625, 2.42059326171875, 2.5433349609375, 2.66607666015625, 2.788818359375, 2.91156005859375, 3.0343017578125, 3.15704345703125, 3.27978515625, 3.40252685546875, 3.5252685546875, 3.64801025390625, 3.770751953125, 3.89349365234375, 4.0162353515625, 4.13897705078125, 4.26171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 14.0, 5.0, 18.0, 18.0, 26.0, 30.0, 27.0, 30.0, 70.0, 69.0, 79.0, 70.0, 95.0, 95.0, 81.0, 69.0, 58.0, 40.0, 30.0, 19.0, 18.0, 8.0, 8.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.681640625, -1.608673095703125, -1.53570556640625, -1.462738037109375, -1.3897705078125, -1.316802978515625, -1.24383544921875, -1.170867919921875, -1.097900390625, -1.024932861328125, -0.95196533203125, -0.878997802734375, -0.8060302734375, -0.733062744140625, -0.66009521484375, -0.587127685546875, -0.51416015625, -0.441192626953125, -0.36822509765625, -0.295257568359375, -0.2222900390625, -0.149322509765625, -0.07635498046875, -0.003387451171875, 0.069580078125, 0.142547607421875, 0.21551513671875, 0.288482666015625, 0.3614501953125, 0.434417724609375, 0.50738525390625, 0.580352783203125, 0.6533203125, 0.726287841796875, 0.79925537109375, 0.872222900390625, 0.9451904296875, 1.018157958984375, 1.09112548828125, 1.164093017578125, 1.237060546875, 1.310028076171875, 1.38299560546875, 1.455963134765625, 1.5289306640625, 1.601898193359375, 1.67486572265625, 1.747833251953125, 1.82080078125, 1.893768310546875, 1.96673583984375, 2.039703369140625, 2.1126708984375, 2.185638427734375, 2.25860595703125, 2.331573486328125, 2.404541015625, 2.477508544921875, 2.55047607421875, 2.623443603515625, 2.6964111328125, 2.769378662109375, 2.84234619140625, 2.915313720703125, 2.98828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 10.0, 24.0, 48.0, 89.0, 161.0, 203.0, 210.0, 126.0, 59.0, 36.0, 16.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.85749816894531, -59.107975006103516, -57.35844802856445, -55.608924865722656, -53.859397888183594, -52.1098747253418, -50.3603515625, -48.61082458496094, -46.86130142211914, -45.111778259277344, -43.36225128173828, -41.612728118896484, -39.86320114135742, -38.113677978515625, -36.36415100097656, -34.614627838134766, -32.86510467529297, -31.11557960510254, -29.36605453491211, -27.616531372070312, -25.867006301879883, -24.117481231689453, -22.367956161499023, -20.618431091308594, -18.86890411376953, -17.1193790435791, -15.369854927062988, -13.620329856872559, -11.870805740356445, -10.121280670166016, -8.371755599975586, -6.622231483459473, -4.872707366943359, -3.123182773590088, -1.3736579418182373, 0.3758668899536133, 2.1253914833068848, 3.8749160766601562, 5.624441146850586, 7.373965263366699, 9.123490333557129, 10.873015403747559, 12.622539520263672, 14.372064590454102, 16.12158966064453, 17.871112823486328, 19.62063980102539, 21.370162963867188, 23.119688034057617, 24.869213104248047, 26.618738174438477, 28.368263244628906, 30.117786407470703, 31.867311477661133, 33.61683654785156, 35.36635971069336, 37.11588668823242, 38.86540985107422, 40.61493682861328, 42.36445999145508, 44.11398696899414, 45.86351013183594, 47.613037109375, 49.3625602722168, 51.112083435058594]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 16.0, 16.0, 18.0, 27.0, 22.0, 30.0, 23.0, 42.0, 56.0, 55.0, 57.0, 49.0, 66.0, 60.0, 64.0, 53.0, 41.0, 34.0, 48.0, 25.0, 40.0, 25.0, 22.0, 12.0, 16.0, 13.0, 11.0, 9.0, 6.0, 5.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.422504425048828, -24.69485855102539, -23.967212677001953, -23.239564895629883, -22.511919021606445, -21.784273147583008, -21.05662727355957, -20.3289794921875, -19.601333618164062, -18.873687744140625, -18.146041870117188, -17.418394088745117, -16.69074821472168, -15.963102340698242, -15.235456466674805, -14.50780963897705, -13.780163764953613, -13.052517890930176, -12.324871063232422, -11.597225189208984, -10.86957836151123, -10.141932487487793, -9.414285659790039, -8.686639785766602, -7.958993434906006, -7.23134708404541, -6.5037007331848145, -5.776054382324219, -5.048408508300781, -4.320761680603027, -3.59311580657959, -2.865469455718994, -2.1378231048583984, -1.4101767539978027, -0.6825305223464966, 0.04511570930480957, 0.7727620601654053, 1.500408411026001, 2.2280545234680176, 2.9557008743286133, 3.683347225189209, 4.410993576049805, 5.1386399269104, 5.866286277770996, 6.593932151794434, 7.3215789794921875, 8.049224853515625, 8.776870727539062, 9.504517555236816, 10.232163429260254, 10.959810256958008, 11.687456130981445, 12.4151029586792, 13.142748832702637, 13.87039566040039, 14.598041534423828, 15.325687408447266, 16.053333282470703, 16.78097915649414, 17.50862693786621, 18.23627281188965, 18.963918685913086, 19.691564559936523, 20.419212341308594, 21.14685821533203]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 6.0, 10.0, 14.0, 27.0, 35.0, 34.0, 64.0, 87.0, 121.0, 204.0, 288.0, 412.0, 637.0, 1063.0, 1704.0, 2785.0, 4774.0, 8729.0, 16250.0, 33438.0, 75294.0, 209098.0, 1350362.0, 2105453.0, 226856.0, 81283.0, 35584.0, 17593.0, 9263.0, 5105.0, 3067.0, 1708.0, 1049.0, 665.0, 417.0, 274.0, 174.0, 106.0, 92.0, 42.0, 32.0, 16.0, 17.0, 18.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4375, -3.32305908203125, -3.2086181640625, -3.09417724609375, -2.979736328125, -2.86529541015625, -2.7508544921875, -2.63641357421875, -2.52197265625, -2.40753173828125, -2.2930908203125, -2.17864990234375, -2.064208984375, -1.94976806640625, -1.8353271484375, -1.72088623046875, -1.6064453125, -1.49200439453125, -1.3775634765625, -1.26312255859375, -1.148681640625, -1.03424072265625, -0.9197998046875, -0.80535888671875, -0.69091796875, -0.57647705078125, -0.4620361328125, -0.34759521484375, -0.233154296875, -0.11871337890625, -0.0042724609375, 0.11016845703125, 0.224609375, 0.33905029296875, 0.4534912109375, 0.56793212890625, 0.682373046875, 0.79681396484375, 0.9112548828125, 1.02569580078125, 1.14013671875, 1.25457763671875, 1.3690185546875, 1.48345947265625, 1.597900390625, 1.71234130859375, 1.8267822265625, 1.94122314453125, 2.0556640625, 2.17010498046875, 2.2845458984375, 2.39898681640625, 2.513427734375, 2.62786865234375, 2.7423095703125, 2.85675048828125, 2.97119140625, 3.08563232421875, 3.2000732421875, 3.31451416015625, 3.428955078125, 3.54339599609375, 3.6578369140625, 3.77227783203125, 3.88671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 9.0, 6.0, 8.0, 12.0, 10.0, 18.0, 12.0, 19.0, 17.0, 31.0, 19.0, 27.0, 31.0, 34.0, 43.0, 43.0, 47.0, 43.0, 47.0, 44.0, 57.0, 36.0, 54.0, 46.0, 31.0, 25.0, 32.0, 39.0, 32.0, 26.0, 19.0, 11.0, 16.0, 11.0, 10.0, 7.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.705078125, -0.6837310791015625, -0.662384033203125, -0.6410369873046875, -0.61968994140625, -0.5983428955078125, -0.576995849609375, -0.5556488037109375, -0.5343017578125, -0.5129547119140625, -0.491607666015625, -0.4702606201171875, -0.44891357421875, -0.4275665283203125, -0.406219482421875, -0.3848724365234375, -0.363525390625, -0.3421783447265625, -0.320831298828125, -0.2994842529296875, -0.27813720703125, -0.2567901611328125, -0.235443115234375, -0.2140960693359375, -0.1927490234375, -0.1714019775390625, -0.150054931640625, -0.1287078857421875, -0.10736083984375, -0.0860137939453125, -0.064666748046875, -0.0433197021484375, -0.02197265625, -0.0006256103515625, 0.020721435546875, 0.0420684814453125, 0.06341552734375, 0.0847625732421875, 0.106109619140625, 0.1274566650390625, 0.1488037109375, 0.1701507568359375, 0.191497802734375, 0.2128448486328125, 0.23419189453125, 0.2555389404296875, 0.276885986328125, 0.2982330322265625, 0.319580078125, 0.3409271240234375, 0.362274169921875, 0.3836212158203125, 0.40496826171875, 0.4263153076171875, 0.447662353515625, 0.4690093994140625, 0.4903564453125, 0.5117034912109375, 0.533050537109375, 0.5543975830078125, 0.57574462890625, 0.5970916748046875, 0.618438720703125, 0.6397857666015625, 0.6611328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 8.0, 12.0, 17.0, 24.0, 26.0, 50.0, 73.0, 101.0, 182.0, 284.0, 563.0, 1133.0, 2827.0, 7949.0, 27065.0, 118538.0, 949563.0, 2811153.0, 212407.0, 43364.0, 11885.0, 3983.0, 1527.0, 704.0, 309.0, 189.0, 107.0, 83.0, 34.0, 30.0, 27.0, 7.0, 15.0, 7.0, 9.0, 3.0, 4.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.4609375, -7.254638671875, -7.04833984375, -6.842041015625, -6.6357421875, -6.429443359375, -6.22314453125, -6.016845703125, -5.810546875, -5.604248046875, -5.39794921875, -5.191650390625, -4.9853515625, -4.779052734375, -4.57275390625, -4.366455078125, -4.16015625, -3.953857421875, -3.74755859375, -3.541259765625, -3.3349609375, -3.128662109375, -2.92236328125, -2.716064453125, -2.509765625, -2.303466796875, -2.09716796875, -1.890869140625, -1.6845703125, -1.478271484375, -1.27197265625, -1.065673828125, -0.859375, -0.653076171875, -0.44677734375, -0.240478515625, -0.0341796875, 0.172119140625, 0.37841796875, 0.584716796875, 0.791015625, 0.997314453125, 1.20361328125, 1.409912109375, 1.6162109375, 1.822509765625, 2.02880859375, 2.235107421875, 2.44140625, 2.647705078125, 2.85400390625, 3.060302734375, 3.2666015625, 3.472900390625, 3.67919921875, 3.885498046875, 4.091796875, 4.298095703125, 4.50439453125, 4.710693359375, 4.9169921875, 5.123291015625, 5.32958984375, 5.535888671875, 5.7421875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 7.0, 15.0, 12.0, 17.0, 21.0, 28.0, 48.0, 61.0, 94.0, 128.0, 204.0, 267.0, 616.0, 1210.0, 465.0, 283.0, 168.0, 123.0, 74.0, 65.0, 50.0, 28.0, 21.0, 18.0, 14.0, 9.0, 7.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.4273681640625, -2.356689453125, -2.2860107421875, -2.21533203125, -2.1446533203125, -2.073974609375, -2.0032958984375, -1.9326171875, -1.8619384765625, -1.791259765625, -1.7205810546875, -1.64990234375, -1.5792236328125, -1.508544921875, -1.4378662109375, -1.3671875, -1.2965087890625, -1.225830078125, -1.1551513671875, -1.08447265625, -1.0137939453125, -0.943115234375, -0.8724365234375, -0.8017578125, -0.7310791015625, -0.660400390625, -0.5897216796875, -0.51904296875, -0.4483642578125, -0.377685546875, -0.3070068359375, -0.236328125, -0.1656494140625, -0.094970703125, -0.0242919921875, 0.04638671875, 0.1170654296875, 0.187744140625, 0.2584228515625, 0.3291015625, 0.3997802734375, 0.470458984375, 0.5411376953125, 0.61181640625, 0.6824951171875, 0.753173828125, 0.8238525390625, 0.89453125, 0.9652099609375, 1.035888671875, 1.1065673828125, 1.17724609375, 1.2479248046875, 1.318603515625, 1.3892822265625, 1.4599609375, 1.5306396484375, 1.601318359375, 1.6719970703125, 1.74267578125, 1.8133544921875, 1.884033203125, 1.9547119140625, 2.025390625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 9.0, 20.0, 26.0, 71.0, 139.0, 178.0, 193.0, 157.0, 105.0, 51.0, 26.0, 18.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.428184509277344, -19.50799560546875, -18.587806701660156, -17.667617797851562, -16.747426986694336, -15.827238082885742, -14.907049179077148, -13.986860275268555, -13.066671371459961, -12.146482467651367, -11.226292610168457, -10.306103706359863, -9.38591480255127, -8.46572494506836, -7.545536041259766, -6.625347137451172, -5.705157279968262, -4.78496789932251, -3.864778995513916, -2.944589614868164, -2.024400472640991, -1.1042113304138184, -0.1840219497680664, 0.7361669540405273, 1.6563563346862793, 2.576545476913452, 3.496734619140625, 4.416923999786377, 5.337113380432129, 6.257302284240723, 7.177491664886475, 8.097681045532227, 9.01786994934082, 9.938058853149414, 10.858248710632324, 11.778437614440918, 12.698626518249512, 13.618816375732422, 14.539005279541016, 15.45919418334961, 16.379383087158203, 17.299571990966797, 18.21976089477539, 19.139949798583984, 20.06014060974121, 20.980329513549805, 21.9005184173584, 22.820707321166992, 23.74089813232422, 24.661087036132812, 25.581275939941406, 26.50146484375, 27.421655654907227, 28.34184455871582, 29.262033462524414, 30.182222366333008, 31.1024112701416, 32.02260208129883, 32.94279098510742, 33.862979888916016, 34.78316879272461, 35.7033576965332, 36.6235466003418, 37.54373550415039, 38.463924407958984]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 12.0, 7.0, 4.0, 12.0, 9.0, 16.0, 16.0, 19.0, 20.0, 26.0, 30.0, 31.0, 45.0, 29.0, 40.0, 36.0, 39.0, 35.0, 35.0, 39.0, 50.0, 38.0, 46.0, 36.0, 44.0, 37.0, 35.0, 29.0, 22.0, 24.0, 19.0, 22.0, 15.0, 13.0, 14.0, 11.0, 9.0, 9.0, 6.0, 1.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.7333598136901855, -7.492978096008301, -7.252595901489258, -7.012214183807373, -6.771832466125488, -6.531450271606445, -6.2910685539245605, -6.050686836242676, -5.810304641723633, -5.569922924041748, -5.329540729522705, -5.08915901184082, -4.848776817321777, -4.608395099639893, -4.368013381958008, -4.127631187438965, -3.88724946975708, -3.646867513656616, -3.4064855575561523, -3.1661038398742676, -2.9257218837738037, -2.68533992767334, -2.444958209991455, -2.204576253890991, -1.9641942977905273, -1.7238123416900635, -1.4834305047988892, -1.2430486679077148, -1.002666711807251, -0.7622847557067871, -0.5219029188156128, -0.2815210819244385, -0.041138648986816406, 0.19924324750900269, 0.4396251440048218, 0.6800070405006409, 0.92038893699646, 1.1607708930969238, 1.4011527299880981, 1.6415345668792725, 1.8819165229797363, 2.1222984790802, 2.362680435180664, 2.603062152862549, 2.8434441089630127, 3.0838260650634766, 3.3242077827453613, 3.564589738845825, 3.804971694946289, 4.045353412628174, 4.285735607147217, 4.526117324829102, 4.7664995193481445, 5.006881237030029, 5.247262954711914, 5.487645149230957, 5.728026866912842, 5.968408584594727, 6.2087907791137695, 6.449172496795654, 6.689554214477539, 6.929936408996582, 7.170318126678467, 7.410699844360352, 7.6510820388793945]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 5.0, 2.0, 8.0, 11.0, 14.0, 22.0, 34.0, 54.0, 78.0, 98.0, 165.0, 280.0, 456.0, 724.0, 1348.0, 2500.0, 4895.0, 10118.0, 22152.0, 49362.0, 110492.0, 242045.0, 312929.0, 158749.0, 71635.0, 31879.0, 14215.0, 6704.0, 3324.0, 1692.0, 999.0, 603.0, 341.0, 226.0, 147.0, 95.0, 53.0, 24.0, 20.0, 16.0, 14.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.89080810546875, -3.7620849609375, -3.63336181640625, -3.504638671875, -3.37591552734375, -3.2471923828125, -3.11846923828125, -2.98974609375, -2.86102294921875, -2.7322998046875, -2.60357666015625, -2.474853515625, -2.34613037109375, -2.2174072265625, -2.08868408203125, -1.9599609375, -1.83123779296875, -1.7025146484375, -1.57379150390625, -1.445068359375, -1.31634521484375, -1.1876220703125, -1.05889892578125, -0.93017578125, -0.80145263671875, -0.6727294921875, -0.54400634765625, -0.415283203125, -0.28656005859375, -0.1578369140625, -0.02911376953125, 0.099609375, 0.22833251953125, 0.3570556640625, 0.48577880859375, 0.614501953125, 0.74322509765625, 0.8719482421875, 1.00067138671875, 1.12939453125, 1.25811767578125, 1.3868408203125, 1.51556396484375, 1.644287109375, 1.77301025390625, 1.9017333984375, 2.03045654296875, 2.1591796875, 2.28790283203125, 2.4166259765625, 2.54534912109375, 2.674072265625, 2.80279541015625, 2.9315185546875, 3.06024169921875, 3.18896484375, 3.31768798828125, 3.4464111328125, 3.57513427734375, 3.703857421875, 3.83258056640625, 3.9613037109375, 4.09002685546875, 4.21875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 9.0, 8.0, 11.0, 9.0, 13.0, 14.0, 17.0, 20.0, 22.0, 25.0, 21.0, 40.0, 40.0, 33.0, 51.0, 38.0, 52.0, 53.0, 52.0, 48.0, 51.0, 47.0, 47.0, 32.0, 32.0, 24.0, 35.0, 26.0, 23.0, 27.0, 20.0, 15.0, 5.0, 8.0, 5.0, 4.0, 1.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7138671875, -0.6916122436523438, -0.6693572998046875, -0.6471023559570312, -0.624847412109375, -0.6025924682617188, -0.5803375244140625, -0.5580825805664062, -0.53582763671875, -0.5135726928710938, -0.4913177490234375, -0.46906280517578125, -0.446807861328125, -0.42455291748046875, -0.4022979736328125, -0.38004302978515625, -0.3577880859375, -0.33553314208984375, -0.3132781982421875, -0.29102325439453125, -0.268768310546875, -0.24651336669921875, -0.2242584228515625, -0.20200347900390625, -0.17974853515625, -0.15749359130859375, -0.1352386474609375, -0.11298370361328125, -0.090728759765625, -0.06847381591796875, -0.0462188720703125, -0.02396392822265625, -0.001708984375, 0.02054595947265625, 0.0428009033203125, 0.06505584716796875, 0.087310791015625, 0.10956573486328125, 0.1318206787109375, 0.15407562255859375, 0.17633056640625, 0.19858551025390625, 0.2208404541015625, 0.24309539794921875, 0.265350341796875, 0.28760528564453125, 0.3098602294921875, 0.33211517333984375, 0.3543701171875, 0.37662506103515625, 0.3988800048828125, 0.42113494873046875, 0.443389892578125, 0.46564483642578125, 0.4878997802734375, 0.5101547241210938, 0.53240966796875, 0.5546646118164062, 0.5769195556640625, 0.5991744995117188, 0.621429443359375, 0.6436843872070312, 0.6659393310546875, 0.6881942749023438, 0.71044921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 12.0, 17.0, 11.0, 20.0, 29.0, 35.0, 64.0, 64.0, 82.0, 140.0, 185.0, 286.0, 359.0, 602.0, 956.0, 1832.0, 3978.0, 9071.0, 22401.0, 57299.0, 144686.0, 325712.0, 282937.0, 117576.0, 46562.0, 18496.0, 7493.0, 3364.0, 1674.0, 862.0, 541.0, 338.0, 232.0, 205.0, 120.0, 77.0, 62.0, 54.0, 33.0, 25.0, 20.0, 13.0, 8.0, 2.0, 8.0, 3.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.482421875, -3.36590576171875, -3.2493896484375, -3.13287353515625, -3.016357421875, -2.89984130859375, -2.7833251953125, -2.66680908203125, -2.55029296875, -2.43377685546875, -2.3172607421875, -2.20074462890625, -2.084228515625, -1.96771240234375, -1.8511962890625, -1.73468017578125, -1.6181640625, -1.50164794921875, -1.3851318359375, -1.26861572265625, -1.152099609375, -1.03558349609375, -0.9190673828125, -0.80255126953125, -0.68603515625, -0.56951904296875, -0.4530029296875, -0.33648681640625, -0.219970703125, -0.10345458984375, 0.0130615234375, 0.12957763671875, 0.24609375, 0.36260986328125, 0.4791259765625, 0.59564208984375, 0.712158203125, 0.82867431640625, 0.9451904296875, 1.06170654296875, 1.17822265625, 1.29473876953125, 1.4112548828125, 1.52777099609375, 1.644287109375, 1.76080322265625, 1.8773193359375, 1.99383544921875, 2.1103515625, 2.22686767578125, 2.3433837890625, 2.45989990234375, 2.576416015625, 2.69293212890625, 2.8094482421875, 2.92596435546875, 3.04248046875, 3.15899658203125, 3.2755126953125, 3.39202880859375, 3.508544921875, 3.62506103515625, 3.7415771484375, 3.85809326171875, 3.974609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 9.0, 5.0, 12.0, 11.0, 10.0, 19.0, 19.0, 15.0, 17.0, 33.0, 31.0, 38.0, 23.0, 29.0, 30.0, 38.0, 45.0, 30.0, 42.0, 47.0, 42.0, 37.0, 42.0, 42.0, 43.0, 36.0, 27.0, 30.0, 32.0, 23.0, 27.0, 17.0, 19.0, 16.0, 15.0, 13.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 7.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.091796875, -3.000823974609375, -2.90985107421875, -2.818878173828125, -2.7279052734375, -2.636932373046875, -2.54595947265625, -2.454986572265625, -2.364013671875, -2.273040771484375, -2.18206787109375, -2.091094970703125, -2.0001220703125, -1.909149169921875, -1.81817626953125, -1.727203369140625, -1.63623046875, -1.545257568359375, -1.45428466796875, -1.363311767578125, -1.2723388671875, -1.181365966796875, -1.09039306640625, -0.999420166015625, -0.908447265625, -0.817474365234375, -0.72650146484375, -0.635528564453125, -0.5445556640625, -0.453582763671875, -0.36260986328125, -0.271636962890625, -0.1806640625, -0.089691162109375, 0.00128173828125, 0.092254638671875, 0.1832275390625, 0.274200439453125, 0.36517333984375, 0.456146240234375, 0.547119140625, 0.638092041015625, 0.72906494140625, 0.820037841796875, 0.9110107421875, 1.001983642578125, 1.09295654296875, 1.183929443359375, 1.27490234375, 1.365875244140625, 1.45684814453125, 1.547821044921875, 1.6387939453125, 1.729766845703125, 1.82073974609375, 1.911712646484375, 2.002685546875, 2.093658447265625, 2.18463134765625, 2.275604248046875, 2.3665771484375, 2.457550048828125, 2.54852294921875, 2.639495849609375, 2.73046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 9.0, 2.0, 2.0, 8.0, 10.0, 12.0, 19.0, 13.0, 26.0, 39.0, 64.0, 91.0, 126.0, 203.0, 348.0, 527.0, 999.0, 1930.0, 4522.0, 13534.0, 55554.0, 291554.0, 515514.0, 124073.0, 25645.0, 7455.0, 2897.0, 1389.0, 739.0, 442.0, 289.0, 170.0, 120.0, 67.0, 53.0, 30.0, 24.0, 20.0, 8.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.20703125, -3.107574462890625, -3.00811767578125, -2.908660888671875, -2.8092041015625, -2.709747314453125, -2.61029052734375, -2.510833740234375, -2.411376953125, -2.311920166015625, -2.21246337890625, -2.113006591796875, -2.0135498046875, -1.914093017578125, -1.81463623046875, -1.715179443359375, -1.61572265625, -1.516265869140625, -1.41680908203125, -1.317352294921875, -1.2178955078125, -1.118438720703125, -1.01898193359375, -0.919525146484375, -0.820068359375, -0.720611572265625, -0.62115478515625, -0.521697998046875, -0.4222412109375, -0.322784423828125, -0.22332763671875, -0.123870849609375, -0.0244140625, 0.075042724609375, 0.17449951171875, 0.273956298828125, 0.3734130859375, 0.472869873046875, 0.57232666015625, 0.671783447265625, 0.771240234375, 0.870697021484375, 0.97015380859375, 1.069610595703125, 1.1690673828125, 1.268524169921875, 1.36798095703125, 1.467437744140625, 1.56689453125, 1.666351318359375, 1.76580810546875, 1.865264892578125, 1.9647216796875, 2.064178466796875, 2.16363525390625, 2.263092041015625, 2.362548828125, 2.462005615234375, 2.56146240234375, 2.660919189453125, 2.7603759765625, 2.859832763671875, 2.95928955078125, 3.058746337890625, 3.158203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 7.0, 5.0, 13.0, 9.0, 18.0, 12.0, 24.0, 17.0, 19.0, 26.0, 39.0, 50.0, 82.0, 109.0, 107.0, 108.0, 72.0, 54.0, 47.0, 32.0, 26.0, 22.0, 20.0, 13.0, 12.0, 13.0, 3.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003070831298828125, -0.0002958737313747406, -0.0002846643328666687, -0.0002734549343585968, -0.0002622455358505249, -0.000251036137342453, -0.0002398267388343811, -0.0002286173403263092, -0.0002174079418182373, -0.0002061985433101654, -0.0001949891448020935, -0.0001837797462940216, -0.0001725703477859497, -0.0001613609492778778, -0.0001501515507698059, -0.000138942152261734, -0.0001277327537536621, -0.00011652335524559021, -0.00010531395673751831, -9.410455822944641e-05, -8.289515972137451e-05, -7.168576121330261e-05, -6.047636270523071e-05, -4.9266964197158813e-05, -3.8057565689086914e-05, -2.6848167181015015e-05, -1.5638768672943115e-05, -4.429370164871216e-06, 6.780028343200684e-06, 1.7989426851272583e-05, 2.9198825359344482e-05, 4.040822386741638e-05, 5.161762237548828e-05, 6.282702088356018e-05, 7.403641939163208e-05, 8.524581789970398e-05, 9.645521640777588e-05, 0.00010766461491584778, 0.00011887401342391968, 0.00013008341193199158, 0.00014129281044006348, 0.00015250220894813538, 0.00016371160745620728, 0.00017492100596427917, 0.00018613040447235107, 0.00019733980298042297, 0.00020854920148849487, 0.00021975859999656677, 0.00023096799850463867, 0.00024217739701271057, 0.00025338679552078247, 0.00026459619402885437, 0.00027580559253692627, 0.00028701499104499817, 0.00029822438955307007, 0.00030943378806114197, 0.00032064318656921387, 0.00033185258507728577, 0.00034306198358535767, 0.00035427138209342957, 0.00036548078060150146, 0.00037669017910957336, 0.00038789957761764526, 0.00039910897612571716, 0.00041031837463378906]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 18.0, 16.0, 20.0, 29.0, 46.0, 86.0, 120.0, 250.0, 460.0, 938.0, 2035.0, 5956.0, 26203.0, 304515.0, 633941.0, 58612.0, 9648.0, 3086.0, 1294.0, 584.0, 274.0, 146.0, 81.0, 49.0, 47.0, 20.0, 16.0, 14.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.90899658203125, -4.7515869140625, -4.59417724609375, -4.436767578125, -4.27935791015625, -4.1219482421875, -3.96453857421875, -3.80712890625, -3.64971923828125, -3.4923095703125, -3.33489990234375, -3.177490234375, -3.02008056640625, -2.8626708984375, -2.70526123046875, -2.5478515625, -2.39044189453125, -2.2330322265625, -2.07562255859375, -1.918212890625, -1.76080322265625, -1.6033935546875, -1.44598388671875, -1.28857421875, -1.13116455078125, -0.9737548828125, -0.81634521484375, -0.658935546875, -0.50152587890625, -0.3441162109375, -0.18670654296875, -0.029296875, 0.12811279296875, 0.2855224609375, 0.44293212890625, 0.600341796875, 0.75775146484375, 0.9151611328125, 1.07257080078125, 1.22998046875, 1.38739013671875, 1.5447998046875, 1.70220947265625, 1.859619140625, 2.01702880859375, 2.1744384765625, 2.33184814453125, 2.4892578125, 2.64666748046875, 2.8040771484375, 2.96148681640625, 3.118896484375, 3.27630615234375, 3.4337158203125, 3.59112548828125, 3.74853515625, 3.90594482421875, 4.0633544921875, 4.22076416015625, 4.378173828125, 4.53558349609375, 4.6929931640625, 4.85040283203125, 5.0078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 5.0, 2.0, 4.0, 7.0, 9.0, 19.0, 22.0, 67.0, 124.0, 175.0, 217.0, 157.0, 102.0, 44.0, 20.0, 8.0, 9.0, 7.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.1024169921875, -3.962646484375, -3.8228759765625, -3.68310546875, -3.5433349609375, -3.403564453125, -3.2637939453125, -3.1240234375, -2.9842529296875, -2.844482421875, -2.7047119140625, -2.56494140625, -2.4251708984375, -2.285400390625, -2.1456298828125, -2.005859375, -1.8660888671875, -1.726318359375, -1.5865478515625, -1.44677734375, -1.3070068359375, -1.167236328125, -1.0274658203125, -0.8876953125, -0.7479248046875, -0.608154296875, -0.4683837890625, -0.32861328125, -0.1888427734375, -0.049072265625, 0.0906982421875, 0.23046875, 0.3702392578125, 0.510009765625, 0.6497802734375, 0.78955078125, 0.9293212890625, 1.069091796875, 1.2088623046875, 1.3486328125, 1.4884033203125, 1.628173828125, 1.7679443359375, 1.90771484375, 2.0474853515625, 2.187255859375, 2.3270263671875, 2.466796875, 2.6065673828125, 2.746337890625, 2.8861083984375, 3.02587890625, 3.1656494140625, 3.305419921875, 3.4451904296875, 3.5849609375, 3.7247314453125, 3.864501953125, 4.0042724609375, 4.14404296875, 4.2838134765625, 4.423583984375, 4.5633544921875, 4.703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 17.0, 27.0, 82.0, 141.0, 198.0, 226.0, 146.0, 99.0, 31.0, 18.0, 8.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5025405883789, -64.65855407714844, -62.8145637512207, -60.970577239990234, -59.1265869140625, -57.28260040283203, -55.43861389160156, -53.594627380371094, -51.75063705444336, -49.90665054321289, -48.062660217285156, -46.21867370605469, -44.37468719482422, -42.530696868896484, -40.686710357666016, -38.84272003173828, -36.99873352050781, -35.154747009277344, -33.31075668334961, -31.46677017211914, -29.62278175354004, -27.778793334960938, -25.93480682373047, -24.090818405151367, -22.246829986572266, -20.402841567993164, -18.558853149414062, -16.714866638183594, -14.870878219604492, -13.02688980102539, -11.182902336120605, -9.33891487121582, -7.494926452636719, -5.650938510894775, -3.806950569152832, -1.9629626274108887, -0.11897468566894531, 1.7250137329101562, 3.5690011978149414, 5.412988662719727, 7.256977081298828, 9.10096549987793, 10.944952964782715, 12.7889404296875, 14.632928848266602, 16.476917266845703, 18.320903778076172, 20.164892196655273, 22.008880615234375, 23.852869033813477, 25.696857452392578, 27.540843963623047, 29.38483238220215, 31.22882080078125, 33.07280731201172, 34.91679382324219, 36.76078414916992, 38.60477066040039, 40.448760986328125, 42.292747497558594, 44.13673400878906, 45.9807243347168, 47.824710845947266, 49.668701171875, 51.51268768310547]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 6.0, 7.0, 10.0, 10.0, 13.0, 14.0, 15.0, 18.0, 24.0, 27.0, 30.0, 32.0, 32.0, 34.0, 38.0, 30.0, 46.0, 51.0, 40.0, 45.0, 51.0, 46.0, 34.0, 40.0, 40.0, 32.0, 25.0, 20.0, 28.0, 28.0, 20.0, 17.0, 23.0, 10.0, 9.0, 9.0, 5.0, 9.0, 8.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.858320236206055, -15.334580421447754, -14.810840606689453, -14.287100791931152, -13.763360977172852, -13.239620208740234, -12.715880393981934, -12.192140579223633, -11.668400764465332, -11.144660949707031, -10.62092113494873, -10.09718132019043, -9.573440551757812, -9.049701690673828, -8.525960922241211, -8.00222110748291, -7.478481292724609, -6.954741477966309, -6.431001663208008, -5.907261371612549, -5.383521556854248, -4.859781742095947, -4.336041450500488, -3.8123016357421875, -3.2885618209838867, -2.764822006225586, -2.241081953048706, -1.7173420190811157, -1.1936020851135254, -0.6698622703552246, -0.14612221717834473, 0.37761783599853516, 0.9013557434082031, 1.4250956773757935, 1.9488356113433838, 2.4725756645202637, 2.9963154792785645, 3.5200552940368652, 4.043795585632324, 4.567535400390625, 5.091275215148926, 5.615015029907227, 6.138754844665527, 6.662495136260986, 7.186234951019287, 7.709974765777588, 8.233715057373047, 8.757454872131348, 9.281194686889648, 9.80493450164795, 10.32867431640625, 10.85241413116455, 11.376153945922852, 11.899894714355469, 12.42363452911377, 12.94737434387207, 13.471114158630371, 13.994853973388672, 14.518593788146973, 15.042333602905273, 15.56607437133789, 16.089813232421875, 16.613554000854492, 17.13729476928711, 17.661033630371094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 13.0, 3.0, 9.0, 20.0, 16.0, 29.0, 36.0, 68.0, 92.0, 123.0, 210.0, 304.0, 465.0, 746.0, 1273.0, 2217.0, 4083.0, 8022.0, 17157.0, 41839.0, 141427.0, 2967215.0, 839675.0, 104441.0, 34454.0, 14598.0, 7024.0, 3662.0, 1989.0, 1136.0, 671.0, 427.0, 277.0, 189.0, 115.0, 83.0, 60.0, 39.0, 22.0, 11.0, 10.0, 9.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-4.8046875, -4.6669921875, -4.529296875, -4.3916015625, -4.25390625, -4.1162109375, -3.978515625, -3.8408203125, -3.703125, -3.5654296875, -3.427734375, -3.2900390625, -3.15234375, -3.0146484375, -2.876953125, -2.7392578125, -2.6015625, -2.4638671875, -2.326171875, -2.1884765625, -2.05078125, -1.9130859375, -1.775390625, -1.6376953125, -1.5, -1.3623046875, -1.224609375, -1.0869140625, -0.94921875, -0.8115234375, -0.673828125, -0.5361328125, -0.3984375, -0.2607421875, -0.123046875, 0.0146484375, 0.15234375, 0.2900390625, 0.427734375, 0.5654296875, 0.703125, 0.8408203125, 0.978515625, 1.1162109375, 1.25390625, 1.3916015625, 1.529296875, 1.6669921875, 1.8046875, 1.9423828125, 2.080078125, 2.2177734375, 2.35546875, 2.4931640625, 2.630859375, 2.7685546875, 2.90625, 3.0439453125, 3.181640625, 3.3193359375, 3.45703125, 3.5947265625, 3.732421875, 3.8701171875, 4.0078125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 8.0, 10.0, 6.0, 11.0, 9.0, 7.0, 24.0, 17.0, 26.0, 23.0, 31.0, 34.0, 37.0, 36.0, 38.0, 58.0, 54.0, 51.0, 50.0, 45.0, 50.0, 47.0, 42.0, 58.0, 34.0, 31.0, 21.0, 28.0, 22.0, 22.0, 16.0, 10.0, 11.0, 7.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.759765625, -0.7361907958984375, -0.712615966796875, -0.6890411376953125, -0.66546630859375, -0.6418914794921875, -0.618316650390625, -0.5947418212890625, -0.5711669921875, -0.5475921630859375, -0.524017333984375, -0.5004425048828125, -0.47686767578125, -0.4532928466796875, -0.429718017578125, -0.4061431884765625, -0.382568359375, -0.3589935302734375, -0.335418701171875, -0.3118438720703125, -0.28826904296875, -0.2646942138671875, -0.241119384765625, -0.2175445556640625, -0.1939697265625, -0.1703948974609375, -0.146820068359375, -0.1232452392578125, -0.09967041015625, -0.0760955810546875, -0.052520751953125, -0.0289459228515625, -0.00537109375, 0.0182037353515625, 0.041778564453125, 0.0653533935546875, 0.08892822265625, 0.1125030517578125, 0.136077880859375, 0.1596527099609375, 0.1832275390625, 0.2068023681640625, 0.230377197265625, 0.2539520263671875, 0.27752685546875, 0.3011016845703125, 0.324676513671875, 0.3482513427734375, 0.371826171875, 0.3954010009765625, 0.418975830078125, 0.4425506591796875, 0.46612548828125, 0.4897003173828125, 0.513275146484375, 0.5368499755859375, 0.5604248046875, 0.5839996337890625, 0.607574462890625, 0.6311492919921875, 0.65472412109375, 0.6782989501953125, 0.701873779296875, 0.7254486083984375, 0.7490234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 12.0, 17.0, 16.0, 20.0, 35.0, 46.0, 65.0, 102.0, 156.0, 246.0, 433.0, 744.0, 1602.0, 3446.0, 8866.0, 24660.0, 83513.0, 460749.0, 3223504.0, 290833.0, 62527.0, 19492.0, 7057.0, 2978.0, 1344.0, 668.0, 383.0, 215.0, 153.0, 114.0, 67.0, 44.0, 36.0, 33.0, 26.0, 16.0, 5.0, 12.0, 7.0, 5.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-4.72265625, -4.5672607421875, -4.411865234375, -4.2564697265625, -4.10107421875, -3.9456787109375, -3.790283203125, -3.6348876953125, -3.4794921875, -3.3240966796875, -3.168701171875, -3.0133056640625, -2.85791015625, -2.7025146484375, -2.547119140625, -2.3917236328125, -2.236328125, -2.0809326171875, -1.925537109375, -1.7701416015625, -1.61474609375, -1.4593505859375, -1.303955078125, -1.1485595703125, -0.9931640625, -0.8377685546875, -0.682373046875, -0.5269775390625, -0.37158203125, -0.2161865234375, -0.060791015625, 0.0946044921875, 0.25, 0.4053955078125, 0.560791015625, 0.7161865234375, 0.87158203125, 1.0269775390625, 1.182373046875, 1.3377685546875, 1.4931640625, 1.6485595703125, 1.803955078125, 1.9593505859375, 2.11474609375, 2.2701416015625, 2.425537109375, 2.5809326171875, 2.736328125, 2.8917236328125, 3.047119140625, 3.2025146484375, 3.35791015625, 3.5133056640625, 3.668701171875, 3.8240966796875, 3.9794921875, 4.1348876953125, 4.290283203125, 4.4456787109375, 4.60107421875, 4.7564697265625, 4.911865234375, 5.0672607421875, 5.22265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 13.0, 10.0, 22.0, 21.0, 38.0, 45.0, 80.0, 154.0, 228.0, 515.0, 1620.0, 635.0, 249.0, 147.0, 88.0, 62.0, 34.0, 31.0, 23.0, 14.0, 7.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.2562255859375, -1.192138671875, -1.1280517578125, -1.06396484375, -0.9998779296875, -0.935791015625, -0.8717041015625, -0.8076171875, -0.7435302734375, -0.679443359375, -0.6153564453125, -0.55126953125, -0.4871826171875, -0.423095703125, -0.3590087890625, -0.294921875, -0.2308349609375, -0.166748046875, -0.1026611328125, -0.03857421875, 0.0255126953125, 0.089599609375, 0.1536865234375, 0.2177734375, 0.2818603515625, 0.345947265625, 0.4100341796875, 0.47412109375, 0.5382080078125, 0.602294921875, 0.6663818359375, 0.73046875, 0.7945556640625, 0.858642578125, 0.9227294921875, 0.98681640625, 1.0509033203125, 1.114990234375, 1.1790771484375, 1.2431640625, 1.3072509765625, 1.371337890625, 1.4354248046875, 1.49951171875, 1.5635986328125, 1.627685546875, 1.6917724609375, 1.755859375, 1.8199462890625, 1.884033203125, 1.9481201171875, 2.01220703125, 2.0762939453125, 2.140380859375, 2.2044677734375, 2.2685546875, 2.3326416015625, 2.396728515625, 2.4608154296875, 2.52490234375, 2.5889892578125, 2.653076171875, 2.7171630859375, 2.78125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 11.0, 14.0, 51.0, 77.0, 97.0, 131.0, 184.0, 143.0, 126.0, 59.0, 41.0, 31.0, 15.0, 10.0, 8.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.526201248168945, -20.995834350585938, -20.46546745300293, -19.935100555419922, -19.40473175048828, -18.874364852905273, -18.343997955322266, -17.813631057739258, -17.28326416015625, -16.752897262573242, -16.222530364990234, -15.69216251373291, -15.161795616149902, -14.631427764892578, -14.10106086730957, -13.570693969726562, -13.040326118469238, -12.50995922088623, -11.979591369628906, -11.449224472045898, -10.91885757446289, -10.388490676879883, -9.858122825622559, -9.32775592803955, -8.797388076782227, -8.267021179199219, -7.736653804779053, -7.206286430358887, -6.675919532775879, -6.145552158355713, -5.615184783935547, -5.084817886352539, -4.554450988769531, -4.024083614349365, -3.4937167167663574, -2.9633493423461914, -2.4329822063446045, -1.9026150703430176, -1.3722476959228516, -0.8418805599212646, -0.31151342391967773, 0.21885377168655396, 0.7492209672927856, 1.279588222503662, 1.809955358505249, 2.340322494506836, 2.870689868927002, 3.401057004928589, 3.931424140930176, 4.461791515350342, 4.99215841293335, 5.522525787353516, 6.052892684936523, 6.5832600593566895, 7.1136274337768555, 7.643994331359863, 8.174362182617188, 8.704729080200195, 9.23509693145752, 9.765463829040527, 10.295830726623535, 10.82619857788086, 11.356565475463867, 11.886932373046875, 12.417299270629883]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 4.0, 13.0, 8.0, 12.0, 6.0, 8.0, 20.0, 21.0, 25.0, 27.0, 31.0, 23.0, 37.0, 42.0, 37.0, 42.0, 42.0, 49.0, 37.0, 40.0, 43.0, 31.0, 34.0, 34.0, 43.0, 32.0, 20.0, 19.0, 32.0, 32.0, 28.0, 19.0, 25.0, 16.0, 14.0, 13.0, 11.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.710840702056885, -5.529642581939697, -5.348443984985352, -5.167245864868164, -4.986047744750977, -4.804849147796631, -4.623651027679443, -4.442452430725098, -4.26125431060791, -4.080056190490723, -3.898857593536377, -3.7176594734191895, -3.536461114883423, -3.3552627563476562, -3.1740646362304688, -2.992866277694702, -2.8116679191589355, -2.630469560623169, -2.4492712020874023, -2.268073081970215, -2.0868747234344482, -1.9056763648986816, -1.7244781255722046, -1.5432798862457275, -1.362081527709961, -1.1808831691741943, -0.9996849298477173, -0.8184866309165955, -0.6372883319854736, -0.4560900330543518, -0.27489173412323, -0.09369349479675293, 0.08750438690185547, 0.2687026858329773, 0.4499009847640991, 0.631099283695221, 0.8122975826263428, 0.9934958815574646, 1.1746941804885864, 1.3558924198150635, 1.53709077835083, 1.7182891368865967, 1.8994873762130737, 2.080685615539551, 2.2618839740753174, 2.443082332611084, 2.6242804527282715, 2.805478811264038, 2.9866771697998047, 3.1678755283355713, 3.349073886871338, 3.5302720069885254, 3.711470365524292, 3.8926687240600586, 4.073866844177246, 4.255064964294434, 4.436263561248779, 4.617461681365967, 4.7986602783203125, 4.9798583984375, 5.1610565185546875, 5.342255115509033, 5.523453235626221, 5.704651832580566, 5.885849952697754]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 8.0, 6.0, 10.0, 14.0, 20.0, 33.0, 58.0, 107.0, 197.0, 394.0, 953.0, 2603.0, 8447.0, 30250.0, 128867.0, 490151.0, 295628.0, 66154.0, 16643.0, 4992.0, 1708.0, 650.0, 288.0, 154.0, 81.0, 51.0, 31.0, 20.0, 8.0, 6.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.8316650390625, -7.585205078125, -7.3387451171875, -7.09228515625, -6.8458251953125, -6.599365234375, -6.3529052734375, -6.1064453125, -5.8599853515625, -5.613525390625, -5.3670654296875, -5.12060546875, -4.8741455078125, -4.627685546875, -4.3812255859375, -4.134765625, -3.8883056640625, -3.641845703125, -3.3953857421875, -3.14892578125, -2.9024658203125, -2.656005859375, -2.4095458984375, -2.1630859375, -1.9166259765625, -1.670166015625, -1.4237060546875, -1.17724609375, -0.9307861328125, -0.684326171875, -0.4378662109375, -0.19140625, 0.0550537109375, 0.301513671875, 0.5479736328125, 0.79443359375, 1.0408935546875, 1.287353515625, 1.5338134765625, 1.7802734375, 2.0267333984375, 2.273193359375, 2.5196533203125, 2.76611328125, 3.0125732421875, 3.259033203125, 3.5054931640625, 3.751953125, 3.9984130859375, 4.244873046875, 4.4913330078125, 4.73779296875, 4.9842529296875, 5.230712890625, 5.4771728515625, 5.7236328125, 5.9700927734375, 6.216552734375, 6.4630126953125, 6.70947265625, 6.9559326171875, 7.202392578125, 7.4488525390625, 7.6953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 9.0, 12.0, 8.0, 7.0, 10.0, 12.0, 14.0, 22.0, 28.0, 27.0, 31.0, 47.0, 40.0, 44.0, 47.0, 51.0, 53.0, 51.0, 64.0, 48.0, 39.0, 53.0, 48.0, 33.0, 42.0, 32.0, 26.0, 21.0, 11.0, 15.0, 15.0, 10.0, 5.0, 6.0, 6.0, 2.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78662109375, -0.7624053955078125, -0.738189697265625, -0.7139739990234375, -0.68975830078125, -0.6655426025390625, -0.641326904296875, -0.6171112060546875, -0.5928955078125, -0.5686798095703125, -0.544464111328125, -0.5202484130859375, -0.49603271484375, -0.4718170166015625, -0.447601318359375, -0.4233856201171875, -0.399169921875, -0.3749542236328125, -0.350738525390625, -0.3265228271484375, -0.30230712890625, -0.2780914306640625, -0.253875732421875, -0.2296600341796875, -0.2054443359375, -0.1812286376953125, -0.157012939453125, -0.1327972412109375, -0.10858154296875, -0.0843658447265625, -0.060150146484375, -0.0359344482421875, -0.01171875, 0.0124969482421875, 0.036712646484375, 0.0609283447265625, 0.08514404296875, 0.1093597412109375, 0.133575439453125, 0.1577911376953125, 0.1820068359375, 0.2062225341796875, 0.230438232421875, 0.2546539306640625, 0.27886962890625, 0.3030853271484375, 0.327301025390625, 0.3515167236328125, 0.375732421875, 0.3999481201171875, 0.424163818359375, 0.4483795166015625, 0.47259521484375, 0.4968109130859375, 0.521026611328125, 0.5452423095703125, 0.5694580078125, 0.5936737060546875, 0.617889404296875, 0.6421051025390625, 0.66632080078125, 0.6905364990234375, 0.714752197265625, 0.7389678955078125, 0.76318359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 5.0, 10.0, 16.0, 8.0, 26.0, 25.0, 41.0, 50.0, 63.0, 77.0, 120.0, 152.0, 192.0, 267.0, 342.0, 476.0, 825.0, 1395.0, 2939.0, 7207.0, 19718.0, 56381.0, 161973.0, 369005.0, 271292.0, 99716.0, 33840.0, 12226.0, 4751.0, 2082.0, 1066.0, 646.0, 429.0, 305.0, 221.0, 168.0, 120.0, 83.0, 70.0, 62.0, 46.0, 41.0, 19.0, 13.0, 11.0, 6.0, 7.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-4.05078125, -3.930816650390625, -3.81085205078125, -3.690887451171875, -3.5709228515625, -3.450958251953125, -3.33099365234375, -3.211029052734375, -3.091064453125, -2.971099853515625, -2.85113525390625, -2.731170654296875, -2.6112060546875, -2.491241455078125, -2.37127685546875, -2.251312255859375, -2.13134765625, -2.011383056640625, -1.89141845703125, -1.771453857421875, -1.6514892578125, -1.531524658203125, -1.41156005859375, -1.291595458984375, -1.171630859375, -1.051666259765625, -0.93170166015625, -0.811737060546875, -0.6917724609375, -0.571807861328125, -0.45184326171875, -0.331878662109375, -0.2119140625, -0.091949462890625, 0.02801513671875, 0.147979736328125, 0.2679443359375, 0.387908935546875, 0.50787353515625, 0.627838134765625, 0.747802734375, 0.867767333984375, 0.98773193359375, 1.107696533203125, 1.2276611328125, 1.347625732421875, 1.46759033203125, 1.587554931640625, 1.70751953125, 1.827484130859375, 1.94744873046875, 2.067413330078125, 2.1873779296875, 2.307342529296875, 2.42730712890625, 2.547271728515625, 2.667236328125, 2.787200927734375, 2.90716552734375, 3.027130126953125, 3.1470947265625, 3.267059326171875, 3.38702392578125, 3.506988525390625, 3.626953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 7.0, 6.0, 2.0, 4.0, 17.0, 17.0, 12.0, 21.0, 24.0, 25.0, 29.0, 36.0, 32.0, 35.0, 37.0, 36.0, 40.0, 44.0, 38.0, 44.0, 42.0, 49.0, 37.0, 31.0, 35.0, 37.0, 34.0, 37.0, 24.0, 23.0, 20.0, 29.0, 17.0, 15.0, 10.0, 8.0, 6.0, 7.0, 7.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.34344482421875, -2.2572021484375, -2.17095947265625, -2.084716796875, -1.99847412109375, -1.9122314453125, -1.82598876953125, -1.73974609375, -1.65350341796875, -1.5672607421875, -1.48101806640625, -1.394775390625, -1.30853271484375, -1.2222900390625, -1.13604736328125, -1.0498046875, -0.96356201171875, -0.8773193359375, -0.79107666015625, -0.704833984375, -0.61859130859375, -0.5323486328125, -0.44610595703125, -0.35986328125, -0.27362060546875, -0.1873779296875, -0.10113525390625, -0.014892578125, 0.07135009765625, 0.1575927734375, 0.24383544921875, 0.330078125, 0.41632080078125, 0.5025634765625, 0.58880615234375, 0.675048828125, 0.76129150390625, 0.8475341796875, 0.93377685546875, 1.02001953125, 1.10626220703125, 1.1925048828125, 1.27874755859375, 1.364990234375, 1.45123291015625, 1.5374755859375, 1.62371826171875, 1.7099609375, 1.79620361328125, 1.8824462890625, 1.96868896484375, 2.054931640625, 2.14117431640625, 2.2274169921875, 2.31365966796875, 2.39990234375, 2.48614501953125, 2.5723876953125, 2.65863037109375, 2.744873046875, 2.83111572265625, 2.9173583984375, 3.00360107421875, 3.08984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 8.0, 1.0, 4.0, 2.0, 4.0, 9.0, 10.0, 13.0, 13.0, 25.0, 42.0, 52.0, 98.0, 154.0, 301.0, 589.0, 1445.0, 3952.0, 13150.0, 70002.0, 495892.0, 393319.0, 52995.0, 10736.0, 3257.0, 1262.0, 548.0, 280.0, 151.0, 82.0, 55.0, 49.0, 14.0, 13.0, 12.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.509765625, -3.392486572265625, -3.27520751953125, -3.157928466796875, -3.0406494140625, -2.923370361328125, -2.80609130859375, -2.688812255859375, -2.571533203125, -2.454254150390625, -2.33697509765625, -2.219696044921875, -2.1024169921875, -1.985137939453125, -1.86785888671875, -1.750579833984375, -1.63330078125, -1.516021728515625, -1.39874267578125, -1.281463623046875, -1.1641845703125, -1.046905517578125, -0.92962646484375, -0.812347412109375, -0.695068359375, -0.577789306640625, -0.46051025390625, -0.343231201171875, -0.2259521484375, -0.108673095703125, 0.00860595703125, 0.125885009765625, 0.2431640625, 0.360443115234375, 0.47772216796875, 0.595001220703125, 0.7122802734375, 0.829559326171875, 0.94683837890625, 1.064117431640625, 1.181396484375, 1.298675537109375, 1.41595458984375, 1.533233642578125, 1.6505126953125, 1.767791748046875, 1.88507080078125, 2.002349853515625, 2.11962890625, 2.236907958984375, 2.35418701171875, 2.471466064453125, 2.5887451171875, 2.706024169921875, 2.82330322265625, 2.940582275390625, 3.057861328125, 3.175140380859375, 3.29241943359375, 3.409698486328125, 3.5269775390625, 3.644256591796875, 3.76153564453125, 3.878814697265625, 3.99609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 5.0, 5.0, 6.0, 14.0, 7.0, 16.0, 9.0, 25.0, 19.0, 23.0, 25.0, 39.0, 46.0, 71.0, 85.0, 122.0, 92.0, 83.0, 54.0, 41.0, 39.0, 30.0, 30.0, 22.0, 19.0, 20.0, 4.0, 11.0, 5.0, 3.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.0004062652587890625, -0.00039550289511680603, -0.00038474053144454956, -0.0003739781677722931, -0.0003632158041000366, -0.00035245344042778015, -0.0003416910767555237, -0.0003309287130832672, -0.00032016634941101074, -0.00030940398573875427, -0.0002986416220664978, -0.00028787925839424133, -0.00027711689472198486, -0.0002663545310497284, -0.0002555921673774719, -0.00024482980370521545, -0.00023406744003295898, -0.00022330507636070251, -0.00021254271268844604, -0.00020178034901618958, -0.0001910179853439331, -0.00018025562167167664, -0.00016949325799942017, -0.0001587308943271637, -0.00014796853065490723, -0.00013720616698265076, -0.0001264438033103943, -0.00011568143963813782, -0.00010491907596588135, -9.415671229362488e-05, -8.339434862136841e-05, -7.263198494911194e-05, -6.186962127685547e-05, -5.1107257604599e-05, -4.034489393234253e-05, -2.958253026008606e-05, -1.882016658782959e-05, -8.05780291557312e-06, 2.7045607566833496e-06, 1.346692442893982e-05, 2.422928810119629e-05, 3.499165177345276e-05, 4.575401544570923e-05, 5.65163791179657e-05, 6.727874279022217e-05, 7.804110646247864e-05, 8.880347013473511e-05, 9.956583380699158e-05, 0.00011032819747924805, 0.00012109056115150452, 0.00013185292482376099, 0.00014261528849601746, 0.00015337765216827393, 0.0001641400158405304, 0.00017490237951278687, 0.00018566474318504333, 0.0001964271068572998, 0.00020718947052955627, 0.00021795183420181274, 0.00022871419787406921, 0.00023947656154632568, 0.00025023892521858215, 0.0002610012888908386, 0.0002717636525630951, 0.00028252601623535156]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 10.0, 7.0, 5.0, 12.0, 24.0, 15.0, 38.0, 35.0, 79.0, 98.0, 159.0, 283.0, 519.0, 1001.0, 2154.0, 5212.0, 18268.0, 106296.0, 625479.0, 241904.0, 33015.0, 7891.0, 2993.0, 1343.0, 635.0, 412.0, 234.0, 135.0, 99.0, 60.0, 32.0, 23.0, 17.0, 14.0, 8.0, 11.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33984375, -3.21923828125, -3.0986328125, -2.97802734375, -2.857421875, -2.73681640625, -2.6162109375, -2.49560546875, -2.375, -2.25439453125, -2.1337890625, -2.01318359375, -1.892578125, -1.77197265625, -1.6513671875, -1.53076171875, -1.41015625, -1.28955078125, -1.1689453125, -1.04833984375, -0.927734375, -0.80712890625, -0.6865234375, -0.56591796875, -0.4453125, -0.32470703125, -0.2041015625, -0.08349609375, 0.037109375, 0.15771484375, 0.2783203125, 0.39892578125, 0.51953125, 0.64013671875, 0.7607421875, 0.88134765625, 1.001953125, 1.12255859375, 1.2431640625, 1.36376953125, 1.484375, 1.60498046875, 1.7255859375, 1.84619140625, 1.966796875, 2.08740234375, 2.2080078125, 2.32861328125, 2.44921875, 2.56982421875, 2.6904296875, 2.81103515625, 2.931640625, 3.05224609375, 3.1728515625, 3.29345703125, 3.4140625, 3.53466796875, 3.6552734375, 3.77587890625, 3.896484375, 4.01708984375, 4.1376953125, 4.25830078125, 4.37890625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 2.0, 11.0, 14.0, 12.0, 13.0, 25.0, 39.0, 37.0, 43.0, 76.0, 58.0, 105.0, 98.0, 97.0, 86.0, 56.0, 57.0, 44.0, 28.0, 18.0, 22.0, 8.0, 3.0, 7.0, 2.0, 9.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.966064453125, -1.89892578125, -1.831787109375, -1.7646484375, -1.697509765625, -1.63037109375, -1.563232421875, -1.49609375, -1.428955078125, -1.36181640625, -1.294677734375, -1.2275390625, -1.160400390625, -1.09326171875, -1.026123046875, -0.958984375, -0.891845703125, -0.82470703125, -0.757568359375, -0.6904296875, -0.623291015625, -0.55615234375, -0.489013671875, -0.421875, -0.354736328125, -0.28759765625, -0.220458984375, -0.1533203125, -0.086181640625, -0.01904296875, 0.048095703125, 0.115234375, 0.182373046875, 0.24951171875, 0.316650390625, 0.3837890625, 0.450927734375, 0.51806640625, 0.585205078125, 0.65234375, 0.719482421875, 0.78662109375, 0.853759765625, 0.9208984375, 0.988037109375, 1.05517578125, 1.122314453125, 1.189453125, 1.256591796875, 1.32373046875, 1.390869140625, 1.4580078125, 1.525146484375, 1.59228515625, 1.659423828125, 1.7265625, 1.793701171875, 1.86083984375, 1.927978515625, 1.9951171875, 2.062255859375, 2.12939453125, 2.196533203125, 2.263671875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 9.0, 20.0, 39.0, 67.0, 99.0, 160.0, 176.0, 152.0, 109.0, 72.0, 47.0, 29.0, 11.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.64947509765625, -35.317970275878906, -33.98646545410156, -32.65495681762695, -31.32345199584961, -29.991947174072266, -28.66044044494629, -27.328933715820312, -25.99742889404297, -24.665924072265625, -23.33441734313965, -22.002910614013672, -20.671405792236328, -19.339900970458984, -18.008394241333008, -16.67688751220703, -15.345382690429688, -14.013876914978027, -12.682371139526367, -11.350865364074707, -10.019359588623047, -8.687853813171387, -7.356348037719727, -6.024842262268066, -4.693336486816406, -3.361830711364746, -2.030324935913086, -0.6988191604614258, 0.6326866149902344, 1.9641923904418945, 3.2956981658935547, 4.627203941345215, 5.958713531494141, 7.290219306945801, 8.621725082397461, 9.953230857849121, 11.284736633300781, 12.616242408752441, 13.947748184204102, 15.279253959655762, 16.610759735107422, 17.942264556884766, 19.273771286010742, 20.60527801513672, 21.936782836914062, 23.268287658691406, 24.599794387817383, 25.93130111694336, 27.262805938720703, 28.594310760498047, 29.925817489624023, 31.25732421875, 32.588829040527344, 33.92033386230469, 35.25183868408203, 36.58334732055664, 37.914852142333984, 39.24635696411133, 40.57786560058594, 41.90937042236328, 43.240875244140625, 44.57238006591797, 45.90388488769531, 47.23539352416992, 48.566898345947266]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 8.0, 7.0, 6.0, 9.0, 9.0, 13.0, 9.0, 14.0, 15.0, 21.0, 27.0, 17.0, 36.0, 36.0, 28.0, 43.0, 35.0, 36.0, 46.0, 41.0, 46.0, 44.0, 40.0, 46.0, 51.0, 36.0, 41.0, 22.0, 31.0, 24.0, 29.0, 29.0, 20.0, 13.0, 12.0, 16.0, 12.0, 3.0, 11.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.586642265319824, -14.08240032196045, -13.578158378601074, -13.0739164352417, -12.569674491882324, -12.06543254852295, -11.561189651489258, -11.056947708129883, -10.552705764770508, -10.048463821411133, -9.544221878051758, -9.039979934692383, -8.535737991333008, -8.031496047973633, -7.5272536277771, -7.023011684417725, -6.518770217895508, -6.014528274536133, -5.510286331176758, -5.006044387817383, -4.501802444458008, -3.9975602626800537, -3.4933180809020996, -2.9890761375427246, -2.4848341941833496, -1.9805922508239746, -1.47635018825531, -0.9721081256866455, -0.4678661823272705, 0.03637576103210449, 0.5406179428100586, 1.0448598861694336, 1.5491008758544922, 2.053342819213867, 2.557584762573242, 3.0618269443511963, 3.5660688877105713, 4.070310592651367, 4.5745530128479, 5.078794956207275, 5.58303689956665, 6.087278842926025, 6.5915207862854, 7.095763206481934, 7.600005149841309, 8.104247093200684, 8.608489036560059, 9.112730979919434, 9.616972923278809, 10.121214866638184, 10.625456809997559, 11.129698753356934, 11.633940696716309, 12.138182640075684, 12.642425537109375, 13.14666748046875, 13.650909423828125, 14.1551513671875, 14.659393310546875, 15.16363525390625, 15.667877197265625, 16.172119140625, 16.676361083984375, 17.18060302734375, 17.684844970703125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 3.0, 4.0, 8.0, 11.0, 22.0, 16.0, 32.0, 48.0, 53.0, 68.0, 120.0, 187.0, 296.0, 421.0, 704.0, 1111.0, 1871.0, 3349.0, 6151.0, 12927.0, 28387.0, 76750.0, 304462.0, 3208946.0, 395204.0, 90039.0, 32800.0, 14285.0, 7078.0, 3662.0, 2083.0, 1147.0, 726.0, 468.0, 273.0, 182.0, 103.0, 86.0, 57.0, 41.0, 41.0, 16.0, 14.0, 9.0, 5.0, 4.0, 0.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40625, -4.274993896484375, -4.14373779296875, -4.012481689453125, -3.8812255859375, -3.749969482421875, -3.61871337890625, -3.487457275390625, -3.356201171875, -3.224945068359375, -3.09368896484375, -2.962432861328125, -2.8311767578125, -2.699920654296875, -2.56866455078125, -2.437408447265625, -2.30615234375, -2.174896240234375, -2.04364013671875, -1.912384033203125, -1.7811279296875, -1.649871826171875, -1.51861572265625, -1.387359619140625, -1.256103515625, -1.124847412109375, -0.99359130859375, -0.862335205078125, -0.7310791015625, -0.599822998046875, -0.46856689453125, -0.337310791015625, -0.2060546875, -0.074798583984375, 0.05645751953125, 0.187713623046875, 0.3189697265625, 0.450225830078125, 0.58148193359375, 0.712738037109375, 0.843994140625, 0.975250244140625, 1.10650634765625, 1.237762451171875, 1.3690185546875, 1.500274658203125, 1.63153076171875, 1.762786865234375, 1.89404296875, 2.025299072265625, 2.15655517578125, 2.287811279296875, 2.4190673828125, 2.550323486328125, 2.68157958984375, 2.812835693359375, 2.944091796875, 3.075347900390625, 3.20660400390625, 3.337860107421875, 3.4691162109375, 3.600372314453125, 3.73162841796875, 3.862884521484375, 3.994140625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 11.0, 8.0, 6.0, 15.0, 18.0, 11.0, 14.0, 22.0, 31.0, 28.0, 46.0, 44.0, 42.0, 51.0, 43.0, 61.0, 45.0, 57.0, 52.0, 53.0, 40.0, 53.0, 34.0, 34.0, 30.0, 33.0, 25.0, 21.0, 18.0, 11.0, 9.0, 11.0, 7.0, 4.0, 1.0, 7.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87841796875, -0.8538131713867188, -0.8292083740234375, -0.8046035766601562, -0.779998779296875, -0.7553939819335938, -0.7307891845703125, -0.7061843872070312, -0.68157958984375, -0.6569747924804688, -0.6323699951171875, -0.6077651977539062, -0.583160400390625, -0.5585556030273438, -0.5339508056640625, -0.5093460083007812, -0.4847412109375, -0.46013641357421875, -0.4355316162109375, -0.41092681884765625, -0.386322021484375, -0.36171722412109375, -0.3371124267578125, -0.31250762939453125, -0.28790283203125, -0.26329803466796875, -0.2386932373046875, -0.21408843994140625, -0.189483642578125, -0.16487884521484375, -0.1402740478515625, -0.11566925048828125, -0.091064453125, -0.06645965576171875, -0.0418548583984375, -0.01725006103515625, 0.007354736328125, 0.03195953369140625, 0.0565643310546875, 0.08116912841796875, 0.10577392578125, 0.13037872314453125, 0.1549835205078125, 0.17958831787109375, 0.204193115234375, 0.22879791259765625, 0.2534027099609375, 0.27800750732421875, 0.3026123046875, 0.32721710205078125, 0.3518218994140625, 0.37642669677734375, 0.401031494140625, 0.42563629150390625, 0.4502410888671875, 0.47484588623046875, 0.49945068359375, 0.5240554809570312, 0.5486602783203125, 0.5732650756835938, 0.597869873046875, 0.6224746704101562, 0.6470794677734375, 0.6716842651367188, 0.6962890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 7.0, 13.0, 22.0, 20.0, 34.0, 38.0, 54.0, 104.0, 139.0, 207.0, 330.0, 624.0, 1070.0, 1910.0, 3631.0, 7336.0, 14789.0, 33052.0, 81296.0, 247420.0, 1968428.0, 1470468.0, 226670.0, 76238.0, 31741.0, 14174.0, 6593.0, 3389.0, 1834.0, 1035.0, 596.0, 340.0, 236.0, 147.0, 96.0, 57.0, 38.0, 35.0, 23.0, 14.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.810546875, -2.710052490234375, -2.60955810546875, -2.509063720703125, -2.4085693359375, -2.308074951171875, -2.20758056640625, -2.107086181640625, -2.006591796875, -1.906097412109375, -1.80560302734375, -1.705108642578125, -1.6046142578125, -1.504119873046875, -1.40362548828125, -1.303131103515625, -1.20263671875, -1.102142333984375, -1.00164794921875, -0.901153564453125, -0.8006591796875, -0.700164794921875, -0.59967041015625, -0.499176025390625, -0.398681640625, -0.298187255859375, -0.19769287109375, -0.097198486328125, 0.0032958984375, 0.103790283203125, 0.20428466796875, 0.304779052734375, 0.4052734375, 0.505767822265625, 0.60626220703125, 0.706756591796875, 0.8072509765625, 0.907745361328125, 1.00823974609375, 1.108734130859375, 1.209228515625, 1.309722900390625, 1.41021728515625, 1.510711669921875, 1.6112060546875, 1.711700439453125, 1.81219482421875, 1.912689208984375, 2.01318359375, 2.113677978515625, 2.21417236328125, 2.314666748046875, 2.4151611328125, 2.515655517578125, 2.61614990234375, 2.716644287109375, 2.817138671875, 2.917633056640625, 3.01812744140625, 3.118621826171875, 3.2191162109375, 3.319610595703125, 3.42010498046875, 3.520599365234375, 3.62109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 9.0, 16.0, 26.0, 19.0, 42.0, 34.0, 44.0, 65.0, 116.0, 161.0, 248.0, 494.0, 1203.0, 650.0, 305.0, 186.0, 93.0, 83.0, 64.0, 53.0, 35.0, 32.0, 20.0, 12.0, 13.0, 6.0, 7.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4814453125, -1.4259490966796875, -1.370452880859375, -1.3149566650390625, -1.25946044921875, -1.2039642333984375, -1.148468017578125, -1.0929718017578125, -1.0374755859375, -0.9819793701171875, -0.926483154296875, -0.8709869384765625, -0.81549072265625, -0.7599945068359375, -0.704498291015625, -0.6490020751953125, -0.593505859375, -0.5380096435546875, -0.482513427734375, -0.4270172119140625, -0.37152099609375, -0.3160247802734375, -0.260528564453125, -0.2050323486328125, -0.1495361328125, -0.0940399169921875, -0.038543701171875, 0.0169525146484375, 0.07244873046875, 0.1279449462890625, 0.183441162109375, 0.2389373779296875, 0.29443359375, 0.3499298095703125, 0.405426025390625, 0.4609222412109375, 0.51641845703125, 0.5719146728515625, 0.627410888671875, 0.6829071044921875, 0.7384033203125, 0.7938995361328125, 0.849395751953125, 0.9048919677734375, 0.96038818359375, 1.0158843994140625, 1.071380615234375, 1.1268768310546875, 1.182373046875, 1.2378692626953125, 1.293365478515625, 1.3488616943359375, 1.40435791015625, 1.4598541259765625, 1.515350341796875, 1.5708465576171875, 1.6263427734375, 1.6818389892578125, 1.737335205078125, 1.7928314208984375, 1.84832763671875, 1.9038238525390625, 1.959320068359375, 2.0148162841796875, 2.0703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 14.0, 10.0, 32.0, 47.0, 105.0, 163.0, 181.0, 165.0, 113.0, 95.0, 40.0, 18.0, 13.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.20398712158203, -18.53911590576172, -17.874244689941406, -17.209373474121094, -16.54450225830078, -15.879631042480469, -15.214759826660156, -14.549888610839844, -13.885017395019531, -13.220146179199219, -12.555274963378906, -11.890403747558594, -11.225532531738281, -10.560661315917969, -9.895790100097656, -9.230918884277344, -8.566047668457031, -7.901176452636719, -7.236305236816406, -6.571434020996094, -5.906562805175781, -5.241691589355469, -4.576820373535156, -3.9119491577148438, -3.2470779418945312, -2.5822067260742188, -1.9173355102539062, -1.2524642944335938, -0.5875930786132812, 0.07727813720703125, 0.7421493530273438, 1.4070205688476562, 2.0718917846679688, 2.7367630004882812, 3.4016342163085938, 4.066505432128906, 4.731376647949219, 5.396247863769531, 6.061119079589844, 6.725990295410156, 7.390861511230469, 8.055732727050781, 8.720603942871094, 9.385475158691406, 10.050346374511719, 10.715217590332031, 11.380088806152344, 12.044960021972656, 12.709831237792969, 13.374702453613281, 14.039573669433594, 14.704444885253906, 15.369316101074219, 16.03418731689453, 16.699058532714844, 17.363929748535156, 18.02880096435547, 18.69367218017578, 19.358543395996094, 20.023414611816406, 20.68828582763672, 21.35315704345703, 22.018028259277344, 22.682899475097656, 23.34777069091797]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 11.0, 12.0, 6.0, 10.0, 14.0, 16.0, 24.0, 22.0, 28.0, 30.0, 28.0, 24.0, 45.0, 35.0, 37.0, 41.0, 37.0, 56.0, 43.0, 51.0, 39.0, 38.0, 49.0, 48.0, 26.0, 34.0, 28.0, 21.0, 32.0, 15.0, 18.0, 13.0, 13.0, 11.0, 6.0, 11.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.75253963470459, -7.532620906829834, -7.312702178955078, -7.0927839279174805, -6.872865200042725, -6.652946472167969, -6.433027744293213, -6.213109016418457, -5.993190288543701, -5.773271560668945, -5.5533528327941895, -5.333434104919434, -5.113515853881836, -4.89359712600708, -4.673678398132324, -4.453759670257568, -4.2338409423828125, -4.013922214508057, -3.79400372505188, -3.574084997177124, -3.354166269302368, -3.1342477798461914, -2.9143290519714355, -2.6944103240966797, -2.474492073059082, -2.254573345184326, -2.0346548557281494, -1.8147361278533936, -1.5948173999786377, -1.3748987913131714, -1.154980182647705, -0.9350614547729492, -0.7151427268981934, -0.4952240586280823, -0.2753054201602936, -0.05538678169250488, 0.1645318865776062, 0.3844505548477173, 0.6043691635131836, 0.8242878913879395, 1.0442065000534058, 1.264125108718872, 1.484043836593628, 1.7039624452590942, 1.9238810539245605, 2.1437997817993164, 2.3637185096740723, 2.583637237548828, 2.803555727005005, 3.0234744548797607, 3.2433929443359375, 3.4633116722106934, 3.683230400085449, 3.903149127960205, 4.123067855834961, 4.342986106872559, 4.5629048347473145, 4.78282356262207, 5.002742290496826, 5.222661018371582, 5.44257926940918, 5.6624979972839355, 5.882416725158691, 6.102335453033447, 6.322254180908203]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 6.0, 6.0, 9.0, 9.0, 14.0, 24.0, 32.0, 49.0, 81.0, 115.0, 179.0, 253.0, 435.0, 826.0, 1587.0, 3271.0, 7338.0, 17054.0, 42284.0, 116329.0, 429672.0, 288192.0, 84065.0, 32294.0, 13072.0, 5713.0, 2576.0, 1289.0, 711.0, 415.0, 227.0, 146.0, 86.0, 74.0, 36.0, 17.0, 16.0, 12.0, 12.0, 7.0, 5.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.76068115234375, -4.6112060546875, -4.46173095703125, -4.312255859375, -4.16278076171875, -4.0133056640625, -3.86383056640625, -3.71435546875, -3.56488037109375, -3.4154052734375, -3.26593017578125, -3.116455078125, -2.96697998046875, -2.8175048828125, -2.66802978515625, -2.5185546875, -2.36907958984375, -2.2196044921875, -2.07012939453125, -1.920654296875, -1.77117919921875, -1.6217041015625, -1.47222900390625, -1.32275390625, -1.17327880859375, -1.0238037109375, -0.87432861328125, -0.724853515625, -0.57537841796875, -0.4259033203125, -0.27642822265625, -0.126953125, 0.02252197265625, 0.1719970703125, 0.32147216796875, 0.470947265625, 0.62042236328125, 0.7698974609375, 0.91937255859375, 1.06884765625, 1.21832275390625, 1.3677978515625, 1.51727294921875, 1.666748046875, 1.81622314453125, 1.9656982421875, 2.11517333984375, 2.2646484375, 2.41412353515625, 2.5635986328125, 2.71307373046875, 2.862548828125, 3.01202392578125, 3.1614990234375, 3.31097412109375, 3.46044921875, 3.60992431640625, 3.7593994140625, 3.90887451171875, 4.058349609375, 4.20782470703125, 4.3572998046875, 4.50677490234375, 4.65625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 10.0, 7.0, 7.0, 11.0, 15.0, 18.0, 19.0, 25.0, 28.0, 36.0, 45.0, 43.0, 46.0, 43.0, 42.0, 54.0, 61.0, 59.0, 55.0, 62.0, 38.0, 31.0, 39.0, 30.0, 36.0, 33.0, 23.0, 18.0, 15.0, 15.0, 10.0, 8.0, 6.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.955078125, -0.9302139282226562, -0.9053497314453125, -0.8804855346679688, -0.855621337890625, -0.8307571411132812, -0.8058929443359375, -0.7810287475585938, -0.75616455078125, -0.7313003540039062, -0.7064361572265625, -0.6815719604492188, -0.656707763671875, -0.6318435668945312, -0.6069793701171875, -0.5821151733398438, -0.5572509765625, -0.5323867797851562, -0.5075225830078125, -0.48265838623046875, -0.457794189453125, -0.43292999267578125, -0.4080657958984375, -0.38320159912109375, -0.35833740234375, -0.33347320556640625, -0.3086090087890625, -0.28374481201171875, -0.258880615234375, -0.23401641845703125, -0.2091522216796875, -0.18428802490234375, -0.159423828125, -0.13455963134765625, -0.1096954345703125, -0.08483123779296875, -0.059967041015625, -0.03510284423828125, -0.0102386474609375, 0.01462554931640625, 0.03948974609375, 0.06435394287109375, 0.0892181396484375, 0.11408233642578125, 0.138946533203125, 0.16381072998046875, 0.1886749267578125, 0.21353912353515625, 0.2384033203125, 0.26326751708984375, 0.2881317138671875, 0.31299591064453125, 0.337860107421875, 0.36272430419921875, 0.3875885009765625, 0.41245269775390625, 0.43731689453125, 0.46218109130859375, 0.4870452880859375, 0.5119094848632812, 0.536773681640625, 0.5616378784179688, 0.5865020751953125, 0.6113662719726562, 0.63623046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 6.0, 7.0, 8.0, 11.0, 9.0, 13.0, 13.0, 25.0, 40.0, 49.0, 68.0, 81.0, 114.0, 172.0, 238.0, 348.0, 565.0, 1096.0, 2460.0, 7032.0, 21928.0, 75023.0, 289630.0, 476598.0, 121252.0, 34142.0, 10503.0, 3596.0, 1471.0, 698.0, 408.0, 279.0, 173.0, 130.0, 94.0, 68.0, 47.0, 48.0, 31.0, 28.0, 21.0, 16.0, 10.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.443359375, -3.311859130859375, -3.18035888671875, -3.048858642578125, -2.9173583984375, -2.785858154296875, -2.65435791015625, -2.522857666015625, -2.391357421875, -2.259857177734375, -2.12835693359375, -1.996856689453125, -1.8653564453125, -1.733856201171875, -1.60235595703125, -1.470855712890625, -1.33935546875, -1.207855224609375, -1.07635498046875, -0.944854736328125, -0.8133544921875, -0.681854248046875, -0.55035400390625, -0.418853759765625, -0.287353515625, -0.155853271484375, -0.02435302734375, 0.107147216796875, 0.2386474609375, 0.370147705078125, 0.50164794921875, 0.633148193359375, 0.7646484375, 0.896148681640625, 1.02764892578125, 1.159149169921875, 1.2906494140625, 1.422149658203125, 1.55364990234375, 1.685150146484375, 1.816650390625, 1.948150634765625, 2.07965087890625, 2.211151123046875, 2.3426513671875, 2.474151611328125, 2.60565185546875, 2.737152099609375, 2.86865234375, 3.000152587890625, 3.13165283203125, 3.263153076171875, 3.3946533203125, 3.526153564453125, 3.65765380859375, 3.789154052734375, 3.920654296875, 4.052154541015625, 4.18365478515625, 4.315155029296875, 4.4466552734375, 4.578155517578125, 4.70965576171875, 4.841156005859375, 4.97265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 6.0, 7.0, 4.0, 5.0, 14.0, 10.0, 17.0, 17.0, 20.0, 26.0, 18.0, 26.0, 28.0, 32.0, 39.0, 29.0, 35.0, 29.0, 34.0, 46.0, 37.0, 40.0, 42.0, 45.0, 35.0, 44.0, 27.0, 42.0, 30.0, 29.0, 43.0, 19.0, 27.0, 15.0, 18.0, 7.0, 14.0, 6.0, 10.0, 10.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.227935791015625, -2.14727783203125, -2.066619873046875, -1.9859619140625, -1.905303955078125, -1.82464599609375, -1.743988037109375, -1.663330078125, -1.582672119140625, -1.50201416015625, -1.421356201171875, -1.3406982421875, -1.260040283203125, -1.17938232421875, -1.098724365234375, -1.01806640625, -0.937408447265625, -0.85675048828125, -0.776092529296875, -0.6954345703125, -0.614776611328125, -0.53411865234375, -0.453460693359375, -0.372802734375, -0.292144775390625, -0.21148681640625, -0.130828857421875, -0.0501708984375, 0.030487060546875, 0.11114501953125, 0.191802978515625, 0.2724609375, 0.353118896484375, 0.43377685546875, 0.514434814453125, 0.5950927734375, 0.675750732421875, 0.75640869140625, 0.837066650390625, 0.917724609375, 0.998382568359375, 1.07904052734375, 1.159698486328125, 1.2403564453125, 1.321014404296875, 1.40167236328125, 1.482330322265625, 1.56298828125, 1.643646240234375, 1.72430419921875, 1.804962158203125, 1.8856201171875, 1.966278076171875, 2.04693603515625, 2.127593994140625, 2.208251953125, 2.288909912109375, 2.36956787109375, 2.450225830078125, 2.5308837890625, 2.611541748046875, 2.69219970703125, 2.772857666015625, 2.853515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 9.0, 8.0, 10.0, 11.0, 31.0, 19.0, 33.0, 43.0, 56.0, 89.0, 113.0, 173.0, 270.0, 394.0, 686.0, 1222.0, 2349.0, 5340.0, 14366.0, 45327.0, 165083.0, 528799.0, 201674.0, 53898.0, 16646.0, 6065.0, 2463.0, 1285.0, 693.0, 418.0, 310.0, 213.0, 137.0, 90.0, 56.0, 44.0, 30.0, 24.0, 18.0, 10.0, 11.0, 8.0, 7.0, 2.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 4.0], "bins": [-2.1953125, -2.131805419921875, -2.06829833984375, -2.004791259765625, -1.9412841796875, -1.877777099609375, -1.81427001953125, -1.750762939453125, -1.687255859375, -1.623748779296875, -1.56024169921875, -1.496734619140625, -1.4332275390625, -1.369720458984375, -1.30621337890625, -1.242706298828125, -1.17919921875, -1.115692138671875, -1.05218505859375, -0.988677978515625, -0.9251708984375, -0.861663818359375, -0.79815673828125, -0.734649658203125, -0.671142578125, -0.607635498046875, -0.54412841796875, -0.480621337890625, -0.4171142578125, -0.353607177734375, -0.29010009765625, -0.226593017578125, -0.1630859375, -0.099578857421875, -0.03607177734375, 0.027435302734375, 0.0909423828125, 0.154449462890625, 0.21795654296875, 0.281463623046875, 0.344970703125, 0.408477783203125, 0.47198486328125, 0.535491943359375, 0.5989990234375, 0.662506103515625, 0.72601318359375, 0.789520263671875, 0.85302734375, 0.916534423828125, 0.98004150390625, 1.043548583984375, 1.1070556640625, 1.170562744140625, 1.23406982421875, 1.297576904296875, 1.361083984375, 1.424591064453125, 1.48809814453125, 1.551605224609375, 1.6151123046875, 1.678619384765625, 1.74212646484375, 1.805633544921875, 1.869140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 9.0, 17.0, 17.0, 20.0, 35.0, 48.0, 77.0, 177.0, 215.0, 119.0, 59.0, 39.0, 33.0, 33.0, 22.0, 12.0, 12.0, 6.0, 8.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0005965232849121094, -0.0005809217691421509, -0.0005653202533721924, -0.0005497187376022339, -0.0005341172218322754, -0.0005185157060623169, -0.0005029141902923584, -0.0004873126745223999, -0.0004717111587524414, -0.0004561096429824829, -0.0004405081272125244, -0.0004249066114425659, -0.0004093050956726074, -0.0003937035799026489, -0.00037810206413269043, -0.00036250054836273193, -0.00034689903259277344, -0.00033129751682281494, -0.00031569600105285645, -0.00030009448528289795, -0.00028449296951293945, -0.00026889145374298096, -0.00025328993797302246, -0.00023768842220306396, -0.00022208690643310547, -0.00020648539066314697, -0.00019088387489318848, -0.00017528235912322998, -0.00015968084335327148, -0.000144079327583313, -0.0001284778118133545, -0.000112876296043396, -9.72747802734375e-05, -8.1673264503479e-05, -6.607174873352051e-05, -5.047023296356201e-05, -3.4868717193603516e-05, -1.926720142364502e-05, -3.6656856536865234e-06, 1.1935830116271973e-05, 2.753734588623047e-05, 4.3138861656188965e-05, 5.874037742614746e-05, 7.434189319610596e-05, 8.994340896606445e-05, 0.00010554492473602295, 0.00012114644050598145, 0.00013674795627593994, 0.00015234947204589844, 0.00016795098781585693, 0.00018355250358581543, 0.00019915401935577393, 0.00021475553512573242, 0.00023035705089569092, 0.0002459585666656494, 0.0002615600824356079, 0.0002771615982055664, 0.0002927631139755249, 0.0003083646297454834, 0.0003239661455154419, 0.0003395676612854004, 0.0003551691770553589, 0.0003707706928253174, 0.0003863722085952759, 0.0004019737243652344]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 7.0, 9.0, 26.0, 29.0, 51.0, 64.0, 116.0, 174.0, 352.0, 515.0, 1152.0, 2830.0, 10514.0, 58951.0, 552304.0, 366933.0, 42021.0, 7875.0, 2458.0, 968.0, 491.0, 252.0, 165.0, 98.0, 71.0, 47.0, 21.0, 17.0, 8.0, 12.0, 2.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.134765625, -3.018280029296875, -2.90179443359375, -2.785308837890625, -2.6688232421875, -2.552337646484375, -2.43585205078125, -2.319366455078125, -2.202880859375, -2.086395263671875, -1.96990966796875, -1.853424072265625, -1.7369384765625, -1.620452880859375, -1.50396728515625, -1.387481689453125, -1.27099609375, -1.154510498046875, -1.03802490234375, -0.921539306640625, -0.8050537109375, -0.688568115234375, -0.57208251953125, -0.455596923828125, -0.339111328125, -0.222625732421875, -0.10614013671875, 0.010345458984375, 0.1268310546875, 0.243316650390625, 0.35980224609375, 0.476287841796875, 0.5927734375, 0.709259033203125, 0.82574462890625, 0.942230224609375, 1.0587158203125, 1.175201416015625, 1.29168701171875, 1.408172607421875, 1.524658203125, 1.641143798828125, 1.75762939453125, 1.874114990234375, 1.9906005859375, 2.107086181640625, 2.22357177734375, 2.340057373046875, 2.45654296875, 2.573028564453125, 2.68951416015625, 2.805999755859375, 2.9224853515625, 3.038970947265625, 3.15545654296875, 3.271942138671875, 3.388427734375, 3.504913330078125, 3.62139892578125, 3.737884521484375, 3.8543701171875, 3.970855712890625, 4.08734130859375, 4.203826904296875, 4.3203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 9.0, 3.0, 5.0, 11.0, 11.0, 8.0, 20.0, 11.0, 27.0, 21.0, 22.0, 35.0, 57.0, 64.0, 82.0, 99.0, 91.0, 95.0, 64.0, 47.0, 40.0, 33.0, 22.0, 31.0, 19.0, 17.0, 10.0, 6.0, 8.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.591796875, -1.5433197021484375, -1.494842529296875, -1.4463653564453125, -1.39788818359375, -1.3494110107421875, -1.300933837890625, -1.2524566650390625, -1.2039794921875, -1.1555023193359375, -1.107025146484375, -1.0585479736328125, -1.01007080078125, -0.9615936279296875, -0.913116455078125, -0.8646392822265625, -0.816162109375, -0.7676849365234375, -0.719207763671875, -0.6707305908203125, -0.62225341796875, -0.5737762451171875, -0.525299072265625, -0.4768218994140625, -0.4283447265625, -0.3798675537109375, -0.331390380859375, -0.2829132080078125, -0.23443603515625, -0.1859588623046875, -0.137481689453125, -0.0890045166015625, -0.04052734375, 0.0079498291015625, 0.056427001953125, 0.1049041748046875, 0.15338134765625, 0.2018585205078125, 0.250335693359375, 0.2988128662109375, 0.3472900390625, 0.3957672119140625, 0.444244384765625, 0.4927215576171875, 0.54119873046875, 0.5896759033203125, 0.638153076171875, 0.6866302490234375, 0.735107421875, 0.7835845947265625, 0.832061767578125, 0.8805389404296875, 0.92901611328125, 0.9774932861328125, 1.025970458984375, 1.0744476318359375, 1.1229248046875, 1.1714019775390625, 1.219879150390625, 1.2683563232421875, 1.31683349609375, 1.3653106689453125, 1.413787841796875, 1.4622650146484375, 1.5107421875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 8.0, 5.0, 18.0, 22.0, 29.0, 39.0, 61.0, 73.0, 92.0, 123.0, 118.0, 104.0, 96.0, 76.0, 55.0, 25.0, 27.0, 12.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.383358001708984, -27.580856323242188, -26.778356552124023, -25.97585678100586, -25.173355102539062, -24.370853424072266, -23.5683536529541, -22.765853881835938, -21.96335220336914, -21.160850524902344, -20.35835075378418, -19.555850982666016, -18.75334930419922, -17.950847625732422, -17.148347854614258, -16.345848083496094, -15.543346405029297, -14.740845680236816, -13.938344955444336, -13.135844230651855, -12.333343505859375, -11.530842781066895, -10.728342056274414, -9.925841331481934, -9.123340606689453, -8.320839881896973, -7.518339157104492, -6.715838432312012, -5.913337707519531, -5.110836982727051, -4.30833625793457, -3.50583553314209, -2.7033329010009766, -1.900832176208496, -1.0983314514160156, -0.29583072662353516, 0.5066699981689453, 1.3091707229614258, 2.1116714477539062, 2.9141721725463867, 3.716672897338867, 4.519173622131348, 5.321674346923828, 6.124175071716309, 6.926675796508789, 7.7291765213012695, 8.53167724609375, 9.33417797088623, 10.136678695678711, 10.939179420471191, 11.741680145263672, 12.544180870056152, 13.346681594848633, 14.149182319641113, 14.951683044433594, 15.754183769226074, 16.556684494018555, 17.35918426513672, 18.161685943603516, 18.964187622070312, 19.766687393188477, 20.56918716430664, 21.371688842773438, 22.174190521240234, 22.9766902923584]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 5.0, 9.0, 10.0, 14.0, 17.0, 32.0, 28.0, 25.0, 29.0, 38.0, 23.0, 37.0, 40.0, 38.0, 38.0, 34.0, 32.0, 40.0, 46.0, 44.0, 36.0, 34.0, 41.0, 34.0, 30.0, 25.0, 33.0, 28.0, 21.0, 21.0, 22.0, 20.0, 11.0, 10.0, 9.0, 9.0, 5.0, 11.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.834770202636719, -12.40081787109375, -11.966865539550781, -11.532912254333496, -11.098959922790527, -10.665007591247559, -10.23105525970459, -9.797101974487305, -9.363149642944336, -8.929197311401367, -8.495244979858398, -8.061291694641113, -7.6273393630981445, -7.193387031555176, -6.759434700012207, -6.32548189163208, -5.891529560089111, -5.457577228546143, -5.023624420166016, -4.589672088623047, -4.15571928024292, -3.721766948699951, -3.2878143787384033, -2.8538618087768555, -2.4199092388153076, -1.9859566688537598, -1.552004098892212, -1.1180516481399536, -0.6840990781784058, -0.25014662742614746, 0.1838059425354004, 0.6177585124969482, 1.051711082458496, 1.485663652420044, 1.9196162223815918, 2.3535685539245605, 2.7875213623046875, 3.2214736938476562, 3.655426263809204, 4.089378833770752, 4.523331642150879, 4.957283973693848, 5.391236782073975, 5.825189113616943, 6.25914192199707, 6.693094253540039, 7.127046585083008, 7.560999393463135, 7.9949517250061035, 8.42890453338623, 8.8628568649292, 9.296809196472168, 9.730761528015137, 10.164714813232422, 10.59866714477539, 11.03261947631836, 11.466571807861328, 11.900524139404297, 12.334476470947266, 12.76842975616455, 13.20238208770752, 13.636334419250488, 14.070286750793457, 14.504240036010742, 14.938192367553711]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 7.0, 15.0, 13.0, 15.0, 20.0, 28.0, 35.0, 52.0, 102.0, 178.0, 372.0, 1047.0, 2986.0, 10929.0, 56191.0, 1604114.0, 2443819.0, 58097.0, 11534.0, 3001.0, 965.0, 346.0, 137.0, 74.0, 46.0, 34.0, 26.0, 20.0, 15.0, 12.0, 7.0, 7.0, 1.0, 10.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.6402587890625, -10.327392578125, -10.0145263671875, -9.70166015625, -9.3887939453125, -9.075927734375, -8.7630615234375, -8.4501953125, -8.1373291015625, -7.824462890625, -7.5115966796875, -7.19873046875, -6.8858642578125, -6.572998046875, -6.2601318359375, -5.947265625, -5.6343994140625, -5.321533203125, -5.0086669921875, -4.69580078125, -4.3829345703125, -4.070068359375, -3.7572021484375, -3.4443359375, -3.1314697265625, -2.818603515625, -2.5057373046875, -2.19287109375, -1.8800048828125, -1.567138671875, -1.2542724609375, -0.94140625, -0.6285400390625, -0.315673828125, -0.0028076171875, 0.31005859375, 0.6229248046875, 0.935791015625, 1.2486572265625, 1.5615234375, 1.8743896484375, 2.187255859375, 2.5001220703125, 2.81298828125, 3.1258544921875, 3.438720703125, 3.7515869140625, 4.064453125, 4.3773193359375, 4.690185546875, 5.0030517578125, 5.31591796875, 5.6287841796875, 5.941650390625, 6.2545166015625, 6.5673828125, 6.8802490234375, 7.193115234375, 7.5059814453125, 7.81884765625, 8.1317138671875, 8.444580078125, 8.7574462890625, 9.0703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 3.0, 8.0, 11.0, 17.0, 17.0, 15.0, 29.0, 33.0, 39.0, 44.0, 45.0, 39.0, 40.0, 48.0, 41.0, 53.0, 43.0, 43.0, 48.0, 56.0, 37.0, 40.0, 40.0, 29.0, 37.0, 27.0, 18.0, 10.0, 15.0, 14.0, 12.0, 13.0, 6.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.92041015625, -0.896636962890625, -0.87286376953125, -0.849090576171875, -0.8253173828125, -0.801544189453125, -0.77777099609375, -0.753997802734375, -0.730224609375, -0.706451416015625, -0.68267822265625, -0.658905029296875, -0.6351318359375, -0.611358642578125, -0.58758544921875, -0.563812255859375, -0.5400390625, -0.516265869140625, -0.49249267578125, -0.468719482421875, -0.4449462890625, -0.421173095703125, -0.39739990234375, -0.373626708984375, -0.349853515625, -0.326080322265625, -0.30230712890625, -0.278533935546875, -0.2547607421875, -0.230987548828125, -0.20721435546875, -0.183441162109375, -0.15966796875, -0.135894775390625, -0.11212158203125, -0.088348388671875, -0.0645751953125, -0.040802001953125, -0.01702880859375, 0.006744384765625, 0.030517578125, 0.054290771484375, 0.07806396484375, 0.101837158203125, 0.1256103515625, 0.149383544921875, 0.17315673828125, 0.196929931640625, 0.220703125, 0.244476318359375, 0.26824951171875, 0.292022705078125, 0.3157958984375, 0.339569091796875, 0.36334228515625, 0.387115478515625, 0.410888671875, 0.434661865234375, 0.45843505859375, 0.482208251953125, 0.5059814453125, 0.529754638671875, 0.55352783203125, 0.577301025390625, 0.60107421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 2.0, 6.0, 5.0, 6.0, 7.0, 11.0, 16.0, 17.0, 24.0, 28.0, 64.0, 87.0, 105.0, 174.0, 294.0, 442.0, 784.0, 1504.0, 3116.0, 7099.0, 18831.0, 60121.0, 281249.0, 3189849.0, 501232.0, 86737.0, 25432.0, 9154.0, 3792.0, 1784.0, 933.0, 497.0, 288.0, 171.0, 128.0, 79.0, 66.0, 39.0, 29.0, 25.0, 18.0, 5.0, 11.0, 5.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.13671875, -4.9884033203125, -4.840087890625, -4.6917724609375, -4.54345703125, -4.3951416015625, -4.246826171875, -4.0985107421875, -3.9501953125, -3.8018798828125, -3.653564453125, -3.5052490234375, -3.35693359375, -3.2086181640625, -3.060302734375, -2.9119873046875, -2.763671875, -2.6153564453125, -2.467041015625, -2.3187255859375, -2.17041015625, -2.0220947265625, -1.873779296875, -1.7254638671875, -1.5771484375, -1.4288330078125, -1.280517578125, -1.1322021484375, -0.98388671875, -0.8355712890625, -0.687255859375, -0.5389404296875, -0.390625, -0.2423095703125, -0.093994140625, 0.0543212890625, 0.20263671875, 0.3509521484375, 0.499267578125, 0.6475830078125, 0.7958984375, 0.9442138671875, 1.092529296875, 1.2408447265625, 1.38916015625, 1.5374755859375, 1.685791015625, 1.8341064453125, 1.982421875, 2.1307373046875, 2.279052734375, 2.4273681640625, 2.57568359375, 2.7239990234375, 2.872314453125, 3.0206298828125, 3.1689453125, 3.3172607421875, 3.465576171875, 3.6138916015625, 3.76220703125, 3.9105224609375, 4.058837890625, 4.2071533203125, 4.35546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 11.0, 8.0, 10.0, 15.0, 27.0, 29.0, 34.0, 46.0, 70.0, 152.0, 240.0, 517.0, 1509.0, 619.0, 287.0, 160.0, 113.0, 63.0, 44.0, 35.0, 27.0, 15.0, 11.0, 11.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.92578125, -1.8667144775390625, -1.807647705078125, -1.7485809326171875, -1.68951416015625, -1.6304473876953125, -1.571380615234375, -1.5123138427734375, -1.4532470703125, -1.3941802978515625, -1.335113525390625, -1.2760467529296875, -1.21697998046875, -1.1579132080078125, -1.098846435546875, -1.0397796630859375, -0.980712890625, -0.9216461181640625, -0.862579345703125, -0.8035125732421875, -0.74444580078125, -0.6853790283203125, -0.626312255859375, -0.5672454833984375, -0.5081787109375, -0.4491119384765625, -0.390045166015625, -0.3309783935546875, -0.27191162109375, -0.2128448486328125, -0.153778076171875, -0.0947113037109375, -0.03564453125, 0.0234222412109375, 0.082489013671875, 0.1415557861328125, 0.20062255859375, 0.2596893310546875, 0.318756103515625, 0.3778228759765625, 0.4368896484375, 0.4959564208984375, 0.555023193359375, 0.6140899658203125, 0.67315673828125, 0.7322235107421875, 0.791290283203125, 0.8503570556640625, 0.909423828125, 0.9684906005859375, 1.027557373046875, 1.0866241455078125, 1.14569091796875, 1.2047576904296875, 1.263824462890625, 1.3228912353515625, 1.3819580078125, 1.4410247802734375, 1.500091552734375, 1.5591583251953125, 1.61822509765625, 1.6772918701171875, 1.736358642578125, 1.7954254150390625, 1.8544921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 12.0, 11.0, 22.0, 27.0, 54.0, 71.0, 97.0, 106.0, 108.0, 102.0, 93.0, 90.0, 76.0, 37.0, 39.0, 17.0, 14.0, 8.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.358756065368652, -12.982189178466797, -12.605622291564941, -12.229055404663086, -11.852487564086914, -11.475920677185059, -11.099353790283203, -10.722786903381348, -10.346220016479492, -9.969653129577637, -9.593086242675781, -9.21651840209961, -8.839951515197754, -8.463384628295898, -8.086817741394043, -7.7102508544921875, -7.333683013916016, -6.95711612701416, -6.5805487632751465, -6.203981876373291, -5.827414512634277, -5.450847625732422, -5.074280738830566, -4.697713851928711, -4.321146488189697, -3.9445793628692627, -3.568012237548828, -3.1914453506469727, -2.814878225326538, -2.4383111000061035, -2.061744213104248, -1.6851770877838135, -1.3086109161376953, -0.9320438504219055, -0.5554767847061157, -0.1789097785949707, 0.19765734672546387, 0.5742244720458984, 0.9507913589477539, 1.3273584842681885, 1.703925609588623, 2.0804927349090576, 2.457059860229492, 2.8336267471313477, 3.2101938724517822, 3.586760997772217, 3.9633278846740723, 4.339895248413086, 4.716462135314941, 5.093029022216797, 5.4695963859558105, 5.846163272857666, 6.22273063659668, 6.599297523498535, 6.975864410400391, 7.352431297302246, 7.72899866104126, 8.105566024780273, 8.482132911682129, 8.858699798583984, 9.23526668548584, 9.611833572387695, 9.988401412963867, 10.364968299865723, 10.741535186767578]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 4.0, 9.0, 13.0, 12.0, 17.0, 24.0, 11.0, 12.0, 24.0, 27.0, 19.0, 35.0, 37.0, 44.0, 38.0, 25.0, 40.0, 37.0, 44.0, 46.0, 35.0, 34.0, 46.0, 42.0, 38.0, 35.0, 24.0, 19.0, 23.0, 14.0, 28.0, 14.0, 17.0, 16.0, 9.0, 11.0, 11.0, 5.0, 10.0, 9.0, 8.0, 4.0, 8.0, 3.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.032009124755859, -4.871853351593018, -4.711697578430176, -4.551541805267334, -4.391386032104492, -4.23123025894165, -4.071074485778809, -3.910918951034546, -3.750763177871704, -3.5906074047088623, -3.4304516315460205, -3.2702958583831787, -3.110140323638916, -2.949984550476074, -2.7898287773132324, -2.6296730041503906, -2.469517230987549, -2.309361457824707, -2.1492056846618652, -1.989050030708313, -1.8288942575454712, -1.6687384843826294, -1.5085828304290771, -1.3484270572662354, -1.1882712841033936, -1.0281155109405518, -0.8679597973823547, -0.7078040838241577, -0.5476483106613159, -0.3874925374984741, -0.2273368239402771, -0.06718111038208008, 0.09297418594360352, 0.2531299293041229, 0.41328567266464233, 0.5734413862228394, 0.7335971593856812, 0.893752932548523, 1.0539085865020752, 1.214064359664917, 1.3742201328277588, 1.5343759059906006, 1.6945316791534424, 1.8546873331069946, 2.014842987060547, 2.1749987602233887, 2.3351545333862305, 2.4953103065490723, 2.655466079711914, 2.815621852874756, 2.9757776260375977, 3.1359333992004395, 3.2960891723632812, 3.456244945526123, 3.6164004802703857, 3.7765562534332275, 3.9367120265960693, 4.096867561340332, 4.257023334503174, 4.417179107666016, 4.577334880828857, 4.737490653991699, 4.897646427154541, 5.057802200317383, 5.217957973480225]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 5.0, 20.0, 23.0, 41.0, 50.0, 96.0, 132.0, 217.0, 359.0, 626.0, 1131.0, 2165.0, 4524.0, 10060.0, 22579.0, 53820.0, 144422.0, 483586.0, 204193.0, 68064.0, 28656.0, 12441.0, 5544.0, 2630.0, 1352.0, 735.0, 397.0, 236.0, 140.0, 98.0, 63.0, 40.0, 32.0, 26.0, 13.0, 10.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.94140625, -4.8065185546875, -4.671630859375, -4.5367431640625, -4.40185546875, -4.2669677734375, -4.132080078125, -3.9971923828125, -3.8623046875, -3.7274169921875, -3.592529296875, -3.4576416015625, -3.32275390625, -3.1878662109375, -3.052978515625, -2.9180908203125, -2.783203125, -2.6483154296875, -2.513427734375, -2.3785400390625, -2.24365234375, -2.1087646484375, -1.973876953125, -1.8389892578125, -1.7041015625, -1.5692138671875, -1.434326171875, -1.2994384765625, -1.16455078125, -1.0296630859375, -0.894775390625, -0.7598876953125, -0.625, -0.4901123046875, -0.355224609375, -0.2203369140625, -0.08544921875, 0.0494384765625, 0.184326171875, 0.3192138671875, 0.4541015625, 0.5889892578125, 0.723876953125, 0.8587646484375, 0.99365234375, 1.1285400390625, 1.263427734375, 1.3983154296875, 1.533203125, 1.6680908203125, 1.802978515625, 1.9378662109375, 2.07275390625, 2.2076416015625, 2.342529296875, 2.4774169921875, 2.6123046875, 2.7471923828125, 2.882080078125, 3.0169677734375, 3.15185546875, 3.2867431640625, 3.421630859375, 3.5565185546875, 3.69140625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 5.0, 14.0, 14.0, 18.0, 15.0, 25.0, 34.0, 30.0, 44.0, 40.0, 49.0, 44.0, 35.0, 52.0, 52.0, 49.0, 53.0, 46.0, 53.0, 38.0, 47.0, 35.0, 29.0, 21.0, 24.0, 28.0, 24.0, 15.0, 9.0, 11.0, 7.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8926315307617188, -0.8677825927734375, -0.8429336547851562, -0.818084716796875, -0.7932357788085938, -0.7683868408203125, -0.7435379028320312, -0.71868896484375, -0.6938400268554688, -0.6689910888671875, -0.6441421508789062, -0.619293212890625, -0.5944442749023438, -0.5695953369140625, -0.5447463989257812, -0.5198974609375, -0.49504852294921875, -0.4701995849609375, -0.44535064697265625, -0.420501708984375, -0.39565277099609375, -0.3708038330078125, -0.34595489501953125, -0.32110595703125, -0.29625701904296875, -0.2714080810546875, -0.24655914306640625, -0.221710205078125, -0.19686126708984375, -0.1720123291015625, -0.14716339111328125, -0.122314453125, -0.09746551513671875, -0.0726165771484375, -0.04776763916015625, -0.022918701171875, 0.00193023681640625, 0.0267791748046875, 0.05162811279296875, 0.07647705078125, 0.10132598876953125, 0.1261749267578125, 0.15102386474609375, 0.175872802734375, 0.20072174072265625, 0.2255706787109375, 0.25041961669921875, 0.2752685546875, 0.30011749267578125, 0.3249664306640625, 0.34981536865234375, 0.374664306640625, 0.39951324462890625, 0.4243621826171875, 0.44921112060546875, 0.47406005859375, 0.49890899658203125, 0.5237579345703125, 0.5486068725585938, 0.573455810546875, 0.5983047485351562, 0.6231536865234375, 0.6480026245117188, 0.6728515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 4.0, 8.0, 10.0, 19.0, 24.0, 31.0, 40.0, 71.0, 71.0, 132.0, 217.0, 348.0, 627.0, 1316.0, 2737.0, 5690.0, 12325.0, 29132.0, 71253.0, 209367.0, 460719.0, 154270.0, 56817.0, 23625.0, 10245.0, 4682.0, 2229.0, 1061.0, 543.0, 337.0, 196.0, 132.0, 60.0, 49.0, 32.0, 31.0, 29.0, 19.0, 12.0, 6.0, 6.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.169677734375, -3.07177734375, -2.973876953125, -2.8759765625, -2.778076171875, -2.68017578125, -2.582275390625, -2.484375, -2.386474609375, -2.28857421875, -2.190673828125, -2.0927734375, -1.994873046875, -1.89697265625, -1.799072265625, -1.701171875, -1.603271484375, -1.50537109375, -1.407470703125, -1.3095703125, -1.211669921875, -1.11376953125, -1.015869140625, -0.91796875, -0.820068359375, -0.72216796875, -0.624267578125, -0.5263671875, -0.428466796875, -0.33056640625, -0.232666015625, -0.134765625, -0.036865234375, 0.06103515625, 0.158935546875, 0.2568359375, 0.354736328125, 0.45263671875, 0.550537109375, 0.6484375, 0.746337890625, 0.84423828125, 0.942138671875, 1.0400390625, 1.137939453125, 1.23583984375, 1.333740234375, 1.431640625, 1.529541015625, 1.62744140625, 1.725341796875, 1.8232421875, 1.921142578125, 2.01904296875, 2.116943359375, 2.21484375, 2.312744140625, 2.41064453125, 2.508544921875, 2.6064453125, 2.704345703125, 2.80224609375, 2.900146484375, 2.998046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 4.0, 11.0, 5.0, 10.0, 19.0, 24.0, 10.0, 28.0, 22.0, 40.0, 34.0, 35.0, 39.0, 50.0, 43.0, 42.0, 53.0, 46.0, 49.0, 49.0, 37.0, 48.0, 29.0, 38.0, 35.0, 36.0, 28.0, 18.0, 19.0, 20.0, 14.0, 10.0, 10.0, 8.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966796875, -2.868255615234375, -2.76971435546875, -2.671173095703125, -2.5726318359375, -2.474090576171875, -2.37554931640625, -2.277008056640625, -2.178466796875, -2.079925537109375, -1.98138427734375, -1.882843017578125, -1.7843017578125, -1.685760498046875, -1.58721923828125, -1.488677978515625, -1.39013671875, -1.291595458984375, -1.19305419921875, -1.094512939453125, -0.9959716796875, -0.897430419921875, -0.79888916015625, -0.700347900390625, -0.601806640625, -0.503265380859375, -0.40472412109375, -0.306182861328125, -0.2076416015625, -0.109100341796875, -0.01055908203125, 0.087982177734375, 0.1865234375, 0.285064697265625, 0.38360595703125, 0.482147216796875, 0.5806884765625, 0.679229736328125, 0.77777099609375, 0.876312255859375, 0.974853515625, 1.073394775390625, 1.17193603515625, 1.270477294921875, 1.3690185546875, 1.467559814453125, 1.56610107421875, 1.664642333984375, 1.76318359375, 1.861724853515625, 1.96026611328125, 2.058807373046875, 2.1573486328125, 2.255889892578125, 2.35443115234375, 2.452972412109375, 2.551513671875, 2.650054931640625, 2.74859619140625, 2.847137451171875, 2.9456787109375, 3.044219970703125, 3.14276123046875, 3.241302490234375, 3.33984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 9.0, 7.0, 15.0, 21.0, 22.0, 26.0, 58.0, 98.0, 171.0, 291.0, 585.0, 1416.0, 3615.0, 11328.0, 42348.0, 202293.0, 588810.0, 149580.0, 33189.0, 9181.0, 3117.0, 1172.0, 544.0, 274.0, 144.0, 84.0, 47.0, 36.0, 23.0, 11.0, 12.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.07421875, -2.010223388671875, -1.94622802734375, -1.882232666015625, -1.8182373046875, -1.754241943359375, -1.69024658203125, -1.626251220703125, -1.562255859375, -1.498260498046875, -1.43426513671875, -1.370269775390625, -1.3062744140625, -1.242279052734375, -1.17828369140625, -1.114288330078125, -1.05029296875, -0.986297607421875, -0.92230224609375, -0.858306884765625, -0.7943115234375, -0.730316162109375, -0.66632080078125, -0.602325439453125, -0.538330078125, -0.474334716796875, -0.41033935546875, -0.346343994140625, -0.2823486328125, -0.218353271484375, -0.15435791015625, -0.090362548828125, -0.0263671875, 0.037628173828125, 0.10162353515625, 0.165618896484375, 0.2296142578125, 0.293609619140625, 0.35760498046875, 0.421600341796875, 0.485595703125, 0.549591064453125, 0.61358642578125, 0.677581787109375, 0.7415771484375, 0.805572509765625, 0.86956787109375, 0.933563232421875, 0.99755859375, 1.061553955078125, 1.12554931640625, 1.189544677734375, 1.2535400390625, 1.317535400390625, 1.38153076171875, 1.445526123046875, 1.509521484375, 1.573516845703125, 1.63751220703125, 1.701507568359375, 1.7655029296875, 1.829498291015625, 1.89349365234375, 1.957489013671875, 2.021484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 6.0, 8.0, 15.0, 17.0, 17.0, 29.0, 49.0, 96.0, 209.0, 222.0, 123.0, 67.0, 39.0, 22.0, 17.0, 15.0, 14.0, 5.0, 2.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005578994750976562, -0.0005436614155769348, -0.0005294233560562134, -0.0005151852965354919, -0.0005009472370147705, -0.00048670917749404907, -0.00047247111797332764, -0.0004582330584526062, -0.00044399499893188477, -0.00042975693941116333, -0.0004155188798904419, -0.00040128082036972046, -0.000387042760848999, -0.0003728047013282776, -0.00035856664180755615, -0.0003443285822868347, -0.0003300905227661133, -0.00031585246324539185, -0.0003016144037246704, -0.000287376344203949, -0.00027313828468322754, -0.0002589002251625061, -0.00024466216564178467, -0.00023042410612106323, -0.0002161860466003418, -0.00020194798707962036, -0.00018770992755889893, -0.0001734718680381775, -0.00015923380851745605, -0.00014499574899673462, -0.00013075768947601318, -0.00011651962995529175, -0.00010228157043457031, -8.804351091384888e-05, -7.380545139312744e-05, -5.9567391872406006e-05, -4.532933235168457e-05, -3.1091272830963135e-05, -1.68532133102417e-05, -2.6151537895202637e-06, 1.1622905731201172e-05, 2.5860965251922607e-05, 4.009902477264404e-05, 5.433708429336548e-05, 6.857514381408691e-05, 8.281320333480835e-05, 9.705126285552979e-05, 0.00011128932237625122, 0.00012552738189697266, 0.0001397654414176941, 0.00015400350093841553, 0.00016824156045913696, 0.0001824796199798584, 0.00019671767950057983, 0.00021095573902130127, 0.0002251937985420227, 0.00023943185806274414, 0.0002536699175834656, 0.000267907977104187, 0.00028214603662490845, 0.0002963840961456299, 0.0003106221556663513, 0.00032486021518707275, 0.0003390982747077942, 0.0003533363342285156]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 7.0, 13.0, 21.0, 19.0, 31.0, 44.0, 61.0, 97.0, 149.0, 228.0, 324.0, 550.0, 945.0, 1713.0, 3335.0, 7070.0, 16720.0, 42765.0, 121977.0, 377153.0, 313120.0, 99697.0, 35655.0, 13942.0, 6225.0, 2915.0, 1467.0, 844.0, 506.0, 297.0, 207.0, 115.0, 98.0, 66.0, 45.0, 31.0, 18.0, 23.0, 19.0, 8.0, 4.0, 7.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3955078125, -1.3503570556640625, -1.305206298828125, -1.2600555419921875, -1.21490478515625, -1.1697540283203125, -1.124603271484375, -1.0794525146484375, -1.0343017578125, -0.9891510009765625, -0.944000244140625, -0.8988494873046875, -0.85369873046875, -0.8085479736328125, -0.763397216796875, -0.7182464599609375, -0.673095703125, -0.6279449462890625, -0.582794189453125, -0.5376434326171875, -0.49249267578125, -0.4473419189453125, -0.402191162109375, -0.3570404052734375, -0.3118896484375, -0.2667388916015625, -0.221588134765625, -0.1764373779296875, -0.13128662109375, -0.0861358642578125, -0.040985107421875, 0.0041656494140625, 0.04931640625, 0.0944671630859375, 0.139617919921875, 0.1847686767578125, 0.22991943359375, 0.2750701904296875, 0.320220947265625, 0.3653717041015625, 0.4105224609375, 0.4556732177734375, 0.500823974609375, 0.5459747314453125, 0.59112548828125, 0.6362762451171875, 0.681427001953125, 0.7265777587890625, 0.771728515625, 0.8168792724609375, 0.862030029296875, 0.9071807861328125, 0.95233154296875, 0.9974822998046875, 1.042633056640625, 1.0877838134765625, 1.1329345703125, 1.1780853271484375, 1.223236083984375, 1.2683868408203125, 1.31353759765625, 1.3586883544921875, 1.403839111328125, 1.4489898681640625, 1.494140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 7.0, 12.0, 6.0, 18.0, 20.0, 15.0, 29.0, 34.0, 38.0, 38.0, 41.0, 55.0, 56.0, 83.0, 93.0, 72.0, 59.0, 48.0, 45.0, 31.0, 27.0, 31.0, 21.0, 30.0, 17.0, 13.0, 12.0, 5.0, 5.0, 6.0, 9.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.259765625, -1.2239227294921875, -1.188079833984375, -1.1522369384765625, -1.11639404296875, -1.0805511474609375, -1.044708251953125, -1.0088653564453125, -0.9730224609375, -0.9371795654296875, -0.901336669921875, -0.8654937744140625, -0.82965087890625, -0.7938079833984375, -0.757965087890625, -0.7221221923828125, -0.686279296875, -0.6504364013671875, -0.614593505859375, -0.5787506103515625, -0.54290771484375, -0.5070648193359375, -0.471221923828125, -0.4353790283203125, -0.3995361328125, -0.3636932373046875, -0.327850341796875, -0.2920074462890625, -0.25616455078125, -0.2203216552734375, -0.184478759765625, -0.1486358642578125, -0.11279296875, -0.0769500732421875, -0.041107177734375, -0.0052642822265625, 0.03057861328125, 0.0664215087890625, 0.102264404296875, 0.1381072998046875, 0.1739501953125, 0.2097930908203125, 0.245635986328125, 0.2814788818359375, 0.31732177734375, 0.3531646728515625, 0.389007568359375, 0.4248504638671875, 0.460693359375, 0.4965362548828125, 0.532379150390625, 0.5682220458984375, 0.60406494140625, 0.6399078369140625, 0.675750732421875, 0.7115936279296875, 0.7474365234375, 0.7832794189453125, 0.819122314453125, 0.8549652099609375, 0.89080810546875, 0.9266510009765625, 0.962493896484375, 0.9983367919921875, 1.0341796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 30.0, 59.0, 134.0, 207.0, 207.0, 144.0, 116.0, 56.0, 25.0, 12.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.401687622070312, -23.00246810913086, -21.603248596191406, -20.20402717590332, -18.804807662963867, -17.405588150024414, -16.006366729736328, -14.607147216796875, -13.207927703857422, -11.808708190917969, -10.4094877243042, -9.01026725769043, -7.611047744750977, -6.211827754974365, -4.812607765197754, -3.4133872985839844, -2.0141677856445312, -0.6149477958679199, 0.7842721939086914, 2.1834921836853027, 3.582712173461914, 4.981932163238525, 6.381152153015137, 7.780372619628906, 9.17959213256836, 10.578811645507812, 11.978032112121582, 13.377252578735352, 14.776472091674805, 16.175691604614258, 17.574913024902344, 18.974132537841797, 20.37335205078125, 21.772571563720703, 23.171791076660156, 24.571012496948242, 25.970232009887695, 27.36945152282715, 28.768672943115234, 30.167892456054688, 31.56711196899414, 32.966331481933594, 34.36555099487305, 35.7647705078125, 37.16399383544922, 38.56321334838867, 39.962432861328125, 41.36165237426758, 42.76087188720703, 44.160091400146484, 45.55931091308594, 46.95853042602539, 48.357749938964844, 49.75697326660156, 51.156192779541016, 52.55541229248047, 53.95463180541992, 55.353851318359375, 56.75307083129883, 58.15229034423828, 59.551513671875, 60.95073318481445, 62.349952697753906, 63.74917221069336, 65.14839172363281]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 5.0, 7.0, 7.0, 10.0, 9.0, 16.0, 14.0, 23.0, 8.0, 18.0, 37.0, 20.0, 22.0, 37.0, 39.0, 46.0, 35.0, 34.0, 44.0, 47.0, 56.0, 26.0, 41.0, 34.0, 45.0, 40.0, 27.0, 38.0, 32.0, 22.0, 22.0, 19.0, 25.0, 17.0, 19.0, 11.0, 6.0, 10.0, 7.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.834763526916504, -12.426362037658691, -12.017960548400879, -11.60955810546875, -11.201156616210938, -10.792755126953125, -10.384353637695312, -9.9759521484375, -9.567549705505371, -9.159148216247559, -8.750746726989746, -8.342344284057617, -7.933942794799805, -7.525541305541992, -7.11713981628418, -6.708737850189209, -6.3003363609313965, -5.891934871673584, -5.483532905578613, -5.075131416320801, -4.66672945022583, -4.258327960968018, -3.849926233291626, -3.4415245056152344, -3.0331227779388428, -2.624721050262451, -2.2163193225860596, -1.8079177141189575, -1.399515986442566, -0.9911143779754639, -0.5827126502990723, -0.17431092262268066, 0.23409080505371094, 0.6424925327301025, 1.0508942604064941, 1.4592958688735962, 1.8676975965499878, 2.27609920501709, 2.6845009326934814, 3.092902660369873, 3.5013043880462646, 3.9097061157226562, 4.318107604980469, 4.7265095710754395, 5.134911060333252, 5.543313026428223, 5.951714515686035, 6.360116004943848, 6.768517971038818, 7.176919460296631, 7.585321426391602, 7.993722915649414, 8.402124404907227, 8.810525894165039, 9.218928337097168, 9.62732982635498, 10.035731315612793, 10.444132804870605, 10.852534294128418, 11.260936737060547, 11.66933822631836, 12.077739715576172, 12.486141204833984, 12.894542694091797, 13.302945137023926]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 13.0, 20.0, 29.0, 21.0, 40.0, 66.0, 83.0, 149.0, 188.0, 278.0, 497.0, 805.0, 1432.0, 2720.0, 5951.0, 13761.0, 39175.0, 154765.0, 3353515.0, 501782.0, 77039.0, 23940.0, 9056.0, 4198.0, 2013.0, 1096.0, 595.0, 381.0, 245.0, 132.0, 90.0, 53.0, 45.0, 32.0, 20.0, 16.0, 12.0, 11.0, 9.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9765625, -6.76995849609375, -6.5633544921875, -6.35675048828125, -6.150146484375, -5.94354248046875, -5.7369384765625, -5.53033447265625, -5.32373046875, -5.11712646484375, -4.9105224609375, -4.70391845703125, -4.497314453125, -4.29071044921875, -4.0841064453125, -3.87750244140625, -3.6708984375, -3.46429443359375, -3.2576904296875, -3.05108642578125, -2.844482421875, -2.63787841796875, -2.4312744140625, -2.22467041015625, -2.01806640625, -1.81146240234375, -1.6048583984375, -1.39825439453125, -1.191650390625, -0.98504638671875, -0.7784423828125, -0.57183837890625, -0.365234375, -0.15863037109375, 0.0479736328125, 0.25457763671875, 0.461181640625, 0.66778564453125, 0.8743896484375, 1.08099365234375, 1.28759765625, 1.49420166015625, 1.7008056640625, 1.90740966796875, 2.114013671875, 2.32061767578125, 2.5272216796875, 2.73382568359375, 2.9404296875, 3.14703369140625, 3.3536376953125, 3.56024169921875, 3.766845703125, 3.97344970703125, 4.1800537109375, 4.38665771484375, 4.59326171875, 4.79986572265625, 5.0064697265625, 5.21307373046875, 5.419677734375, 5.62628173828125, 5.8328857421875, 6.03948974609375, 6.24609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 12.0, 12.0, 16.0, 14.0, 14.0, 16.0, 21.0, 24.0, 26.0, 43.0, 57.0, 36.0, 30.0, 46.0, 50.0, 48.0, 46.0, 51.0, 41.0, 45.0, 48.0, 48.0, 46.0, 33.0, 26.0, 23.0, 28.0, 15.0, 21.0, 15.0, 14.0, 11.0, 2.0, 6.0, 6.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91552734375, -0.89105224609375, -0.8665771484375, -0.84210205078125, -0.817626953125, -0.79315185546875, -0.7686767578125, -0.74420166015625, -0.7197265625, -0.69525146484375, -0.6707763671875, -0.64630126953125, -0.621826171875, -0.59735107421875, -0.5728759765625, -0.54840087890625, -0.52392578125, -0.49945068359375, -0.4749755859375, -0.45050048828125, -0.426025390625, -0.40155029296875, -0.3770751953125, -0.35260009765625, -0.328125, -0.30364990234375, -0.2791748046875, -0.25469970703125, -0.230224609375, -0.20574951171875, -0.1812744140625, -0.15679931640625, -0.13232421875, -0.10784912109375, -0.0833740234375, -0.05889892578125, -0.034423828125, -0.00994873046875, 0.0145263671875, 0.03900146484375, 0.0634765625, 0.08795166015625, 0.1124267578125, 0.13690185546875, 0.161376953125, 0.18585205078125, 0.2103271484375, 0.23480224609375, 0.25927734375, 0.28375244140625, 0.3082275390625, 0.33270263671875, 0.357177734375, 0.38165283203125, 0.4061279296875, 0.43060302734375, 0.455078125, 0.47955322265625, 0.5040283203125, 0.52850341796875, 0.552978515625, 0.57745361328125, 0.6019287109375, 0.62640380859375, 0.65087890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 13.0, 14.0, 26.0, 42.0, 47.0, 91.0, 150.0, 273.0, 497.0, 946.0, 1887.0, 3813.0, 8567.0, 19459.0, 50132.0, 161168.0, 2185521.0, 1525138.0, 153459.0, 48225.0, 18947.0, 8270.0, 3718.0, 1838.0, 905.0, 482.0, 270.0, 135.0, 78.0, 47.0, 37.0, 21.0, 18.0, 6.0, 10.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.638671875, -3.508636474609375, -3.37860107421875, -3.248565673828125, -3.1185302734375, -2.988494873046875, -2.85845947265625, -2.728424072265625, -2.598388671875, -2.468353271484375, -2.33831787109375, -2.208282470703125, -2.0782470703125, -1.948211669921875, -1.81817626953125, -1.688140869140625, -1.55810546875, -1.428070068359375, -1.29803466796875, -1.167999267578125, -1.0379638671875, -0.907928466796875, -0.77789306640625, -0.647857666015625, -0.517822265625, -0.387786865234375, -0.25775146484375, -0.127716064453125, 0.0023193359375, 0.132354736328125, 0.26239013671875, 0.392425537109375, 0.5224609375, 0.652496337890625, 0.78253173828125, 0.912567138671875, 1.0426025390625, 1.172637939453125, 1.30267333984375, 1.432708740234375, 1.562744140625, 1.692779541015625, 1.82281494140625, 1.952850341796875, 2.0828857421875, 2.212921142578125, 2.34295654296875, 2.472991943359375, 2.60302734375, 2.733062744140625, 2.86309814453125, 2.993133544921875, 3.1231689453125, 3.253204345703125, 3.38323974609375, 3.513275146484375, 3.643310546875, 3.773345947265625, 3.90338134765625, 4.033416748046875, 4.1634521484375, 4.293487548828125, 4.42352294921875, 4.553558349609375, 4.68359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 9.0, 14.0, 16.0, 21.0, 30.0, 36.0, 60.0, 69.0, 109.0, 176.0, 349.0, 1415.0, 928.0, 310.0, 179.0, 88.0, 58.0, 55.0, 33.0, 25.0, 11.0, 17.0, 14.0, 9.0, 5.0, 11.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.658203125, -1.602783203125, -1.54736328125, -1.491943359375, -1.4365234375, -1.381103515625, -1.32568359375, -1.270263671875, -1.21484375, -1.159423828125, -1.10400390625, -1.048583984375, -0.9931640625, -0.937744140625, -0.88232421875, -0.826904296875, -0.771484375, -0.716064453125, -0.66064453125, -0.605224609375, -0.5498046875, -0.494384765625, -0.43896484375, -0.383544921875, -0.328125, -0.272705078125, -0.21728515625, -0.161865234375, -0.1064453125, -0.051025390625, 0.00439453125, 0.059814453125, 0.115234375, 0.170654296875, 0.22607421875, 0.281494140625, 0.3369140625, 0.392333984375, 0.44775390625, 0.503173828125, 0.55859375, 0.614013671875, 0.66943359375, 0.724853515625, 0.7802734375, 0.835693359375, 0.89111328125, 0.946533203125, 1.001953125, 1.057373046875, 1.11279296875, 1.168212890625, 1.2236328125, 1.279052734375, 1.33447265625, 1.389892578125, 1.4453125, 1.500732421875, 1.55615234375, 1.611572265625, 1.6669921875, 1.722412109375, 1.77783203125, 1.833251953125, 1.888671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 7.0, 14.0, 20.0, 49.0, 52.0, 88.0, 133.0, 122.0, 110.0, 110.0, 94.0, 69.0, 41.0, 31.0, 17.0, 16.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.941224098205566, -10.575727462768555, -10.210230827331543, -9.844734191894531, -9.47923755645752, -9.113740921020508, -8.748244285583496, -8.382747650146484, -8.017251014709473, -7.651754379272461, -7.286257743835449, -6.9207611083984375, -6.555264472961426, -6.189767837524414, -5.824271202087402, -5.458774566650391, -5.093277931213379, -4.727781295776367, -4.3622846603393555, -3.9967880249023438, -3.631291389465332, -3.2657947540283203, -2.9002981185913086, -2.534801483154297, -2.169304847717285, -1.8038082122802734, -1.4383115768432617, -1.07281494140625, -0.7073183059692383, -0.34182167053222656, 0.023674964904785156, 0.3891716003417969, 0.754669189453125, 1.1201658248901367, 1.4856624603271484, 1.8511590957641602, 2.216655731201172, 2.5821523666381836, 2.9476490020751953, 3.313145637512207, 3.6786422729492188, 4.0441389083862305, 4.409635543823242, 4.775132179260254, 5.140628814697266, 5.506125450134277, 5.871622085571289, 6.237118721008301, 6.6026153564453125, 6.968111991882324, 7.333608627319336, 7.699105262756348, 8.06460189819336, 8.430098533630371, 8.795595169067383, 9.161091804504395, 9.526588439941406, 9.892085075378418, 10.25758171081543, 10.623078346252441, 10.988574981689453, 11.354071617126465, 11.719568252563477, 12.085064888000488, 12.4505615234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 7.0, 9.0, 10.0, 14.0, 19.0, 24.0, 32.0, 41.0, 37.0, 37.0, 39.0, 39.0, 55.0, 58.0, 45.0, 30.0, 50.0, 61.0, 46.0, 52.0, 44.0, 32.0, 37.0, 35.0, 35.0, 29.0, 20.0, 15.0, 15.0, 9.0, 5.0, 11.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.829183578491211, -7.616166591644287, -7.403149127960205, -7.190132141113281, -6.977114677429199, -6.764097690582275, -6.551080703735352, -6.3380632400512695, -6.125046253204346, -5.912029266357422, -5.69901180267334, -5.485994815826416, -5.272977828979492, -5.05996036529541, -4.846943378448486, -4.6339263916015625, -4.4209089279174805, -4.207891941070557, -3.9948744773864746, -3.781857490539551, -3.568840265274048, -3.355823040008545, -3.142806053161621, -2.929788827896118, -2.7167716026306152, -2.5037543773651123, -2.2907371520996094, -2.0777201652526855, -1.8647029399871826, -1.6516857147216797, -1.4386686086654663, -1.225651502609253, -1.01263427734375, -0.7996171116828918, -0.5865999460220337, -0.37358278036117554, -0.16056561470031738, 0.05245161056518555, 0.2654687166213989, 0.4784858226776123, 0.6915030479431152, 0.9045202136039734, 1.1175373792648315, 1.330554485321045, 1.5435717105865479, 1.7565889358520508, 1.9696060419082642, 2.1826231479644775, 2.3956403732299805, 2.6086575984954834, 2.8216748237609863, 3.03469181060791, 3.247709035873413, 3.460726261138916, 3.67374324798584, 3.8867604732513428, 4.099777698516846, 4.3127946853637695, 4.525812149047852, 4.738829135894775, 4.951846122741699, 5.164863586425781, 5.377880573272705, 5.590897560119629, 5.803915023803711]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 15.0, 15.0, 27.0, 60.0, 79.0, 155.0, 269.0, 390.0, 705.0, 1215.0, 2376.0, 4786.0, 10146.0, 23351.0, 55005.0, 126989.0, 282772.0, 298065.0, 136768.0, 58620.0, 25175.0, 10829.0, 5049.0, 2489.0, 1357.0, 769.0, 414.0, 260.0, 131.0, 113.0, 60.0, 35.0, 15.0, 14.0, 4.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7578125, -3.62841796875, -3.4990234375, -3.36962890625, -3.240234375, -3.11083984375, -2.9814453125, -2.85205078125, -2.72265625, -2.59326171875, -2.4638671875, -2.33447265625, -2.205078125, -2.07568359375, -1.9462890625, -1.81689453125, -1.6875, -1.55810546875, -1.4287109375, -1.29931640625, -1.169921875, -1.04052734375, -0.9111328125, -0.78173828125, -0.65234375, -0.52294921875, -0.3935546875, -0.26416015625, -0.134765625, -0.00537109375, 0.1240234375, 0.25341796875, 0.3828125, 0.51220703125, 0.6416015625, 0.77099609375, 0.900390625, 1.02978515625, 1.1591796875, 1.28857421875, 1.41796875, 1.54736328125, 1.6767578125, 1.80615234375, 1.935546875, 2.06494140625, 2.1943359375, 2.32373046875, 2.453125, 2.58251953125, 2.7119140625, 2.84130859375, 2.970703125, 3.10009765625, 3.2294921875, 3.35888671875, 3.48828125, 3.61767578125, 3.7470703125, 3.87646484375, 4.005859375, 4.13525390625, 4.2646484375, 4.39404296875, 4.5234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 5.0, 15.0, 10.0, 20.0, 20.0, 24.0, 24.0, 25.0, 36.0, 35.0, 42.0, 36.0, 50.0, 56.0, 34.0, 60.0, 55.0, 51.0, 52.0, 44.0, 35.0, 37.0, 39.0, 32.0, 29.0, 28.0, 22.0, 16.0, 13.0, 13.0, 7.0, 8.0, 7.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9638671875, -0.9376373291015625, -0.911407470703125, -0.8851776123046875, -0.85894775390625, -0.8327178955078125, -0.806488037109375, -0.7802581787109375, -0.7540283203125, -0.7277984619140625, -0.701568603515625, -0.6753387451171875, -0.64910888671875, -0.6228790283203125, -0.596649169921875, -0.5704193115234375, -0.544189453125, -0.5179595947265625, -0.491729736328125, -0.4654998779296875, -0.43927001953125, -0.4130401611328125, -0.386810302734375, -0.3605804443359375, -0.3343505859375, -0.3081207275390625, -0.281890869140625, -0.2556610107421875, -0.22943115234375, -0.2032012939453125, -0.176971435546875, -0.1507415771484375, -0.12451171875, -0.0982818603515625, -0.072052001953125, -0.0458221435546875, -0.01959228515625, 0.0066375732421875, 0.032867431640625, 0.0590972900390625, 0.0853271484375, 0.1115570068359375, 0.137786865234375, 0.1640167236328125, 0.19024658203125, 0.2164764404296875, 0.242706298828125, 0.2689361572265625, 0.295166015625, 0.3213958740234375, 0.347625732421875, 0.3738555908203125, 0.40008544921875, 0.4263153076171875, 0.452545166015625, 0.4787750244140625, 0.5050048828125, 0.5312347412109375, 0.557464599609375, 0.5836944580078125, 0.60992431640625, 0.6361541748046875, 0.662384033203125, 0.6886138916015625, 0.71484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 7.0, 6.0, 12.0, 11.0, 21.0, 14.0, 25.0, 31.0, 51.0, 60.0, 72.0, 95.0, 141.0, 162.0, 239.0, 309.0, 401.0, 585.0, 1149.0, 2454.0, 7887.0, 30124.0, 119548.0, 401434.0, 348159.0, 98692.0, 24904.0, 6599.0, 2227.0, 1026.0, 575.0, 395.0, 277.0, 206.0, 144.0, 121.0, 93.0, 75.0, 55.0, 40.0, 30.0, 22.0, 22.0, 14.0, 10.0, 13.0, 10.0, 6.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.50006103515625, -4.3634033203125, -4.22674560546875, -4.090087890625, -3.95343017578125, -3.8167724609375, -3.68011474609375, -3.54345703125, -3.40679931640625, -3.2701416015625, -3.13348388671875, -2.996826171875, -2.86016845703125, -2.7235107421875, -2.58685302734375, -2.4501953125, -2.31353759765625, -2.1768798828125, -2.04022216796875, -1.903564453125, -1.76690673828125, -1.6302490234375, -1.49359130859375, -1.35693359375, -1.22027587890625, -1.0836181640625, -0.94696044921875, -0.810302734375, -0.67364501953125, -0.5369873046875, -0.40032958984375, -0.263671875, -0.12701416015625, 0.0096435546875, 0.14630126953125, 0.282958984375, 0.41961669921875, 0.5562744140625, 0.69293212890625, 0.82958984375, 0.96624755859375, 1.1029052734375, 1.23956298828125, 1.376220703125, 1.51287841796875, 1.6495361328125, 1.78619384765625, 1.9228515625, 2.05950927734375, 2.1961669921875, 2.33282470703125, 2.469482421875, 2.60614013671875, 2.7427978515625, 2.87945556640625, 3.01611328125, 3.15277099609375, 3.2894287109375, 3.42608642578125, 3.562744140625, 3.69940185546875, 3.8360595703125, 3.97271728515625, 4.109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 4.0, 3.0, 7.0, 4.0, 10.0, 11.0, 14.0, 14.0, 13.0, 15.0, 27.0, 21.0, 18.0, 27.0, 21.0, 35.0, 28.0, 35.0, 30.0, 42.0, 37.0, 34.0, 40.0, 46.0, 43.0, 38.0, 30.0, 23.0, 36.0, 25.0, 35.0, 28.0, 25.0, 25.0, 20.0, 16.0, 9.0, 20.0, 15.0, 11.0, 11.0, 10.0, 5.0, 8.0, 6.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.69921875, -2.61529541015625, -2.5313720703125, -2.44744873046875, -2.363525390625, -2.27960205078125, -2.1956787109375, -2.11175537109375, -2.02783203125, -1.94390869140625, -1.8599853515625, -1.77606201171875, -1.692138671875, -1.60821533203125, -1.5242919921875, -1.44036865234375, -1.3564453125, -1.27252197265625, -1.1885986328125, -1.10467529296875, -1.020751953125, -0.93682861328125, -0.8529052734375, -0.76898193359375, -0.68505859375, -0.60113525390625, -0.5172119140625, -0.43328857421875, -0.349365234375, -0.26544189453125, -0.1815185546875, -0.09759521484375, -0.013671875, 0.07025146484375, 0.1541748046875, 0.23809814453125, 0.322021484375, 0.40594482421875, 0.4898681640625, 0.57379150390625, 0.65771484375, 0.74163818359375, 0.8255615234375, 0.90948486328125, 0.993408203125, 1.07733154296875, 1.1612548828125, 1.24517822265625, 1.3291015625, 1.41302490234375, 1.4969482421875, 1.58087158203125, 1.664794921875, 1.74871826171875, 1.8326416015625, 1.91656494140625, 2.00048828125, 2.08441162109375, 2.1683349609375, 2.25225830078125, 2.336181640625, 2.42010498046875, 2.5040283203125, 2.58795166015625, 2.671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 13.0, 20.0, 34.0, 84.0, 150.0, 347.0, 949.0, 3109.0, 12875.0, 75536.0, 542480.0, 352276.0, 48088.0, 9005.0, 2271.0, 736.0, 282.0, 122.0, 66.0, 37.0, 26.0, 13.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.447265625, -3.34552001953125, -3.2437744140625, -3.14202880859375, -3.040283203125, -2.93853759765625, -2.8367919921875, -2.73504638671875, -2.63330078125, -2.53155517578125, -2.4298095703125, -2.32806396484375, -2.226318359375, -2.12457275390625, -2.0228271484375, -1.92108154296875, -1.8193359375, -1.71759033203125, -1.6158447265625, -1.51409912109375, -1.412353515625, -1.31060791015625, -1.2088623046875, -1.10711669921875, -1.00537109375, -0.90362548828125, -0.8018798828125, -0.70013427734375, -0.598388671875, -0.49664306640625, -0.3948974609375, -0.29315185546875, -0.19140625, -0.08966064453125, 0.0120849609375, 0.11383056640625, 0.215576171875, 0.31732177734375, 0.4190673828125, 0.52081298828125, 0.62255859375, 0.72430419921875, 0.8260498046875, 0.92779541015625, 1.029541015625, 1.13128662109375, 1.2330322265625, 1.33477783203125, 1.4365234375, 1.53826904296875, 1.6400146484375, 1.74176025390625, 1.843505859375, 1.94525146484375, 2.0469970703125, 2.14874267578125, 2.25048828125, 2.35223388671875, 2.4539794921875, 2.55572509765625, 2.657470703125, 2.75921630859375, 2.8609619140625, 2.96270751953125, 3.064453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 7.0, 12.0, 14.0, 14.0, 24.0, 23.0, 34.0, 50.0, 52.0, 70.0, 115.0, 141.0, 97.0, 68.0, 57.0, 56.0, 41.0, 16.0, 18.0, 18.0, 12.0, 12.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003597736358642578, -0.0003486238420009613, -0.0003374740481376648, -0.0003263242542743683, -0.0003151744604110718, -0.00030402466654777527, -0.00029287487268447876, -0.00028172507882118225, -0.00027057528495788574, -0.00025942549109458923, -0.0002482756972312927, -0.00023712590336799622, -0.0002259761095046997, -0.0002148263156414032, -0.0002036765217781067, -0.00019252672791481018, -0.00018137693405151367, -0.00017022714018821716, -0.00015907734632492065, -0.00014792755246162415, -0.00013677775859832764, -0.00012562796473503113, -0.00011447817087173462, -0.00010332837700843811, -9.21785831451416e-05, -8.102878928184509e-05, -6.987899541854858e-05, -5.8729201555252075e-05, -4.7579407691955566e-05, -3.642961382865906e-05, -2.527981996536255e-05, -1.413002610206604e-05, -2.9802322387695312e-06, 8.169561624526978e-06, 1.9319355487823486e-05, 3.0469149351119995e-05, 4.1618943214416504e-05, 5.276873707771301e-05, 6.391853094100952e-05, 7.506832480430603e-05, 8.621811866760254e-05, 9.736791253089905e-05, 0.00010851770639419556, 0.00011966750025749207, 0.00013081729412078857, 0.00014196708798408508, 0.0001531168818473816, 0.0001642666757106781, 0.0001754164695739746, 0.00018656626343727112, 0.00019771605730056763, 0.00020886585116386414, 0.00022001564502716064, 0.00023116543889045715, 0.00024231523275375366, 0.00025346502661705017, 0.0002646148204803467, 0.0002757646143436432, 0.0002869144082069397, 0.0002980642020702362, 0.0003092139959335327, 0.0003203637897968292, 0.00033151358366012573, 0.00034266337752342224, 0.00035381317138671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 5.0, 10.0, 18.0, 21.0, 49.0, 61.0, 178.0, 291.0, 579.0, 1510.0, 7453.0, 83461.0, 802126.0, 139032.0, 10368.0, 1938.0, 705.0, 308.0, 188.0, 97.0, 65.0, 35.0, 24.0, 13.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.16156005859375, -3.9989013671875, -3.83624267578125, -3.673583984375, -3.51092529296875, -3.3482666015625, -3.18560791015625, -3.02294921875, -2.86029052734375, -2.6976318359375, -2.53497314453125, -2.372314453125, -2.20965576171875, -2.0469970703125, -1.88433837890625, -1.7216796875, -1.55902099609375, -1.3963623046875, -1.23370361328125, -1.071044921875, -0.90838623046875, -0.7457275390625, -0.58306884765625, -0.42041015625, -0.25775146484375, -0.0950927734375, 0.06756591796875, 0.230224609375, 0.39288330078125, 0.5555419921875, 0.71820068359375, 0.880859375, 1.04351806640625, 1.2061767578125, 1.36883544921875, 1.531494140625, 1.69415283203125, 1.8568115234375, 2.01947021484375, 2.18212890625, 2.34478759765625, 2.5074462890625, 2.67010498046875, 2.832763671875, 2.99542236328125, 3.1580810546875, 3.32073974609375, 3.4833984375, 3.64605712890625, 3.8087158203125, 3.97137451171875, 4.134033203125, 4.29669189453125, 4.4593505859375, 4.62200927734375, 4.78466796875, 4.94732666015625, 5.1099853515625, 5.27264404296875, 5.435302734375, 5.59796142578125, 5.7606201171875, 5.92327880859375, 6.0859375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 12.0, 15.0, 18.0, 23.0, 43.0, 47.0, 79.0, 79.0, 101.0, 134.0, 103.0, 79.0, 74.0, 48.0, 43.0, 25.0, 21.0, 16.0, 7.0, 12.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.712890625, -3.6252593994140625, -3.537628173828125, -3.4499969482421875, -3.36236572265625, -3.2747344970703125, -3.187103271484375, -3.0994720458984375, -3.0118408203125, -2.9242095947265625, -2.836578369140625, -2.7489471435546875, -2.66131591796875, -2.5736846923828125, -2.486053466796875, -2.3984222412109375, -2.310791015625, -2.2231597900390625, -2.135528564453125, -2.0478973388671875, -1.96026611328125, -1.8726348876953125, -1.785003662109375, -1.6973724365234375, -1.6097412109375, -1.5221099853515625, -1.434478759765625, -1.3468475341796875, -1.25921630859375, -1.1715850830078125, -1.083953857421875, -0.9963226318359375, -0.90869140625, -0.8210601806640625, -0.733428955078125, -0.6457977294921875, -0.55816650390625, -0.4705352783203125, -0.382904052734375, -0.2952728271484375, -0.2076416015625, -0.1200103759765625, -0.032379150390625, 0.0552520751953125, 0.14288330078125, 0.2305145263671875, 0.318145751953125, 0.4057769775390625, 0.493408203125, 0.5810394287109375, 0.668670654296875, 0.7563018798828125, 0.84393310546875, 0.9315643310546875, 1.019195556640625, 1.1068267822265625, 1.1944580078125, 1.2820892333984375, 1.369720458984375, 1.4573516845703125, 1.54498291015625, 1.6326141357421875, 1.720245361328125, 1.8078765869140625, 1.8955078125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 15.0, 45.0, 90.0, 143.0, 188.0, 194.0, 135.0, 88.0, 51.0, 27.0, 10.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.40587615966797, -75.85062408447266, -74.29537200927734, -72.7401123046875, -71.18486022949219, -69.62960815429688, -68.07435607910156, -66.51910400390625, -64.96385192871094, -63.408599853515625, -61.85334396362305, -60.298091888427734, -58.74283981323242, -57.187583923339844, -55.63233184814453, -54.07707977294922, -52.52182388305664, -50.96657180786133, -49.41131591796875, -47.85606384277344, -46.300811767578125, -44.74555969238281, -43.190303802490234, -41.63505172729492, -40.079795837402344, -38.52454376220703, -36.96928787231445, -35.41403579711914, -33.85878372192383, -32.30352783203125, -30.748275756835938, -29.193023681640625, -27.637771606445312, -26.082517623901367, -24.527265548706055, -22.97201156616211, -21.416759490966797, -19.86150550842285, -18.306251525878906, -16.750999450683594, -15.195745468139648, -13.64049243927002, -12.08523941040039, -10.529985427856445, -8.974732398986816, -7.4194793701171875, -5.864225387573242, -4.308972358703613, -2.7537193298339844, -1.1984660625457764, 0.35678720474243164, 1.9120407104492188, 3.4672937393188477, 5.022546768188477, 6.577800750732422, 8.13305377960205, 9.68830680847168, 11.243559837341309, 12.798812866210938, 14.354066848754883, 15.909319877624512, 17.46457290649414, 19.019826889038086, 20.57508087158203, 22.130332946777344]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 3.0, 9.0, 6.0, 11.0, 14.0, 10.0, 21.0, 14.0, 24.0, 17.0, 25.0, 33.0, 22.0, 36.0, 39.0, 39.0, 36.0, 48.0, 46.0, 47.0, 43.0, 40.0, 48.0, 28.0, 40.0, 27.0, 44.0, 23.0, 39.0, 25.0, 22.0, 17.0, 17.0, 17.0, 13.0, 10.0, 5.0, 6.0, 5.0, 8.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.491778373718262, -14.00961971282959, -13.527462005615234, -13.045303344726562, -12.56314468383789, -12.080986022949219, -11.598828315734863, -11.116669654846191, -10.634511947631836, -10.152353286743164, -9.670195579528809, -9.188036918640137, -8.705878257751465, -8.22372055053711, -7.7415618896484375, -7.259403228759766, -6.777244567871094, -6.29508638381958, -5.812927722930908, -5.3307695388793945, -4.848610877990723, -4.366452693939209, -3.8842945098876953, -3.4021360874176025, -2.9199776649475098, -2.437819242477417, -1.9556609392166138, -1.4735026359558105, -0.9913442134857178, -0.509185791015625, -0.027027606964111328, 0.45513081550598145, 0.9372882843017578, 1.4194467067718506, 1.9016050100326538, 2.383763313293457, 2.86592173576355, 3.3480801582336426, 3.8302383422851562, 4.312397003173828, 4.794555187225342, 5.2767133712768555, 5.758872032165527, 6.241030216217041, 6.723188400268555, 7.205347061157227, 7.68750524520874, 8.169663429260254, 8.651822090148926, 9.133980751037598, 9.616138458251953, 10.098297119140625, 10.580455780029297, 11.062614440917969, 11.544772148132324, 12.026930809020996, 12.509088516235352, 12.991247177124023, 13.473404884338379, 13.95556354522705, 14.437722206115723, 14.919879913330078, 15.40203857421875, 15.884197235107422, 16.366355895996094]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 7.0, 5.0, 16.0, 6.0, 14.0, 18.0, 31.0, 63.0, 93.0, 138.0, 215.0, 380.0, 615.0, 1164.0, 2210.0, 4621.0, 10457.0, 27132.0, 80971.0, 356018.0, 3137388.0, 428415.0, 92200.0, 30137.0, 11760.0, 5063.0, 2437.0, 1170.0, 609.0, 386.0, 221.0, 123.0, 84.0, 49.0, 25.0, 12.0, 9.0, 10.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.4140625, -5.26593017578125, -5.1177978515625, -4.96966552734375, -4.821533203125, -4.67340087890625, -4.5252685546875, -4.37713623046875, -4.22900390625, -4.08087158203125, -3.9327392578125, -3.78460693359375, -3.636474609375, -3.48834228515625, -3.3402099609375, -3.19207763671875, -3.0439453125, -2.89581298828125, -2.7476806640625, -2.59954833984375, -2.451416015625, -2.30328369140625, -2.1551513671875, -2.00701904296875, -1.85888671875, -1.71075439453125, -1.5626220703125, -1.41448974609375, -1.266357421875, -1.11822509765625, -0.9700927734375, -0.82196044921875, -0.673828125, -0.52569580078125, -0.3775634765625, -0.22943115234375, -0.081298828125, 0.06683349609375, 0.2149658203125, 0.36309814453125, 0.51123046875, 0.65936279296875, 0.8074951171875, 0.95562744140625, 1.103759765625, 1.25189208984375, 1.4000244140625, 1.54815673828125, 1.6962890625, 1.84442138671875, 1.9925537109375, 2.14068603515625, 2.288818359375, 2.43695068359375, 2.5850830078125, 2.73321533203125, 2.88134765625, 3.02947998046875, 3.1776123046875, 3.32574462890625, 3.473876953125, 3.62200927734375, 3.7701416015625, 3.91827392578125, 4.06640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 7.0, 14.0, 25.0, 19.0, 30.0, 24.0, 29.0, 45.0, 36.0, 45.0, 38.0, 49.0, 51.0, 42.0, 52.0, 49.0, 59.0, 42.0, 44.0, 43.0, 39.0, 33.0, 26.0, 35.0, 22.0, 17.0, 12.0, 13.0, 7.0, 12.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.98486328125, -0.9590682983398438, -0.9332733154296875, -0.9074783325195312, -0.881683349609375, -0.8558883666992188, -0.8300933837890625, -0.8042984008789062, -0.77850341796875, -0.7527084350585938, -0.7269134521484375, -0.7011184692382812, -0.675323486328125, -0.6495285034179688, -0.6237335205078125, -0.5979385375976562, -0.5721435546875, -0.5463485717773438, -0.5205535888671875, -0.49475860595703125, -0.468963623046875, -0.44316864013671875, -0.4173736572265625, -0.39157867431640625, -0.36578369140625, -0.33998870849609375, -0.3141937255859375, -0.28839874267578125, -0.262603759765625, -0.23680877685546875, -0.2110137939453125, -0.18521881103515625, -0.159423828125, -0.13362884521484375, -0.1078338623046875, -0.08203887939453125, -0.056243896484375, -0.03044891357421875, -0.0046539306640625, 0.02114105224609375, 0.04693603515625, 0.07273101806640625, 0.0985260009765625, 0.12432098388671875, 0.150115966796875, 0.17591094970703125, 0.2017059326171875, 0.22750091552734375, 0.2532958984375, 0.27909088134765625, 0.3048858642578125, 0.33068084716796875, 0.356475830078125, 0.38227081298828125, 0.4080657958984375, 0.43386077880859375, 0.45965576171875, 0.48545074462890625, 0.5112457275390625, 0.5370407104492188, 0.562835693359375, 0.5886306762695312, 0.6144256591796875, 0.6402206420898438, 0.666015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 11.0, 4.0, 4.0, 10.0, 11.0, 6.0, 22.0, 32.0, 31.0, 56.0, 101.0, 127.0, 241.0, 365.0, 586.0, 937.0, 1701.0, 3035.0, 5711.0, 11309.0, 23028.0, 50178.0, 124389.0, 393808.0, 2395041.0, 834677.0, 206992.0, 75928.0, 32903.0, 15526.0, 7856.0, 4239.0, 2219.0, 1232.0, 744.0, 464.0, 250.0, 156.0, 118.0, 76.0, 51.0, 32.0, 19.0, 13.0, 9.0, 13.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.580078125, -2.493316650390625, -2.40655517578125, -2.319793701171875, -2.2330322265625, -2.146270751953125, -2.05950927734375, -1.972747802734375, -1.885986328125, -1.799224853515625, -1.71246337890625, -1.625701904296875, -1.5389404296875, -1.452178955078125, -1.36541748046875, -1.278656005859375, -1.19189453125, -1.105133056640625, -1.01837158203125, -0.931610107421875, -0.8448486328125, -0.758087158203125, -0.67132568359375, -0.584564208984375, -0.497802734375, -0.411041259765625, -0.32427978515625, -0.237518310546875, -0.1507568359375, -0.063995361328125, 0.02276611328125, 0.109527587890625, 0.1962890625, 0.283050537109375, 0.36981201171875, 0.456573486328125, 0.5433349609375, 0.630096435546875, 0.71685791015625, 0.803619384765625, 0.890380859375, 0.977142333984375, 1.06390380859375, 1.150665283203125, 1.2374267578125, 1.324188232421875, 1.41094970703125, 1.497711181640625, 1.58447265625, 1.671234130859375, 1.75799560546875, 1.844757080078125, 1.9315185546875, 2.018280029296875, 2.10504150390625, 2.191802978515625, 2.278564453125, 2.365325927734375, 2.45208740234375, 2.538848876953125, 2.6256103515625, 2.712371826171875, 2.79913330078125, 2.885894775390625, 2.97265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 8.0, 3.0, 9.0, 10.0, 21.0, 22.0, 25.0, 38.0, 37.0, 81.0, 88.0, 121.0, 192.0, 340.0, 608.0, 1155.0, 472.0, 259.0, 129.0, 141.0, 81.0, 70.0, 44.0, 34.0, 21.0, 17.0, 12.0, 11.0, 11.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.9970703125, -1.9354095458984375, -1.873748779296875, -1.8120880126953125, -1.75042724609375, -1.6887664794921875, -1.627105712890625, -1.5654449462890625, -1.5037841796875, -1.4421234130859375, -1.380462646484375, -1.3188018798828125, -1.25714111328125, -1.1954803466796875, -1.133819580078125, -1.0721588134765625, -1.010498046875, -0.9488372802734375, -0.887176513671875, -0.8255157470703125, -0.76385498046875, -0.7021942138671875, -0.640533447265625, -0.5788726806640625, -0.5172119140625, -0.4555511474609375, -0.393890380859375, -0.3322296142578125, -0.27056884765625, -0.2089080810546875, -0.147247314453125, -0.0855865478515625, -0.02392578125, 0.0377349853515625, 0.099395751953125, 0.1610565185546875, 0.22271728515625, 0.2843780517578125, 0.346038818359375, 0.4076995849609375, 0.4693603515625, 0.5310211181640625, 0.592681884765625, 0.6543426513671875, 0.71600341796875, 0.7776641845703125, 0.839324951171875, 0.9009857177734375, 0.962646484375, 1.0243072509765625, 1.085968017578125, 1.1476287841796875, 1.20928955078125, 1.2709503173828125, 1.332611083984375, 1.3942718505859375, 1.4559326171875, 1.5175933837890625, 1.579254150390625, 1.6409149169921875, 1.70257568359375, 1.7642364501953125, 1.825897216796875, 1.8875579833984375, 1.94921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 16.0, 19.0, 23.0, 33.0, 54.0, 87.0, 84.0, 119.0, 125.0, 85.0, 100.0, 77.0, 55.0, 32.0, 30.0, 19.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.284547805786133, -17.84395980834961, -17.40337371826172, -16.962785720825195, -16.522197723388672, -16.08161163330078, -15.641023635864258, -15.200435638427734, -14.759848594665527, -14.31926155090332, -13.878673553466797, -13.43808650970459, -12.997499465942383, -12.55691146850586, -12.116324424743652, -11.675737380981445, -11.235149383544922, -10.794562339782715, -10.353974342346191, -9.913387298583984, -9.472800254821777, -9.032212257385254, -8.591625213623047, -8.151037216186523, -7.710451126098633, -7.269863605499268, -6.8292765617370605, -6.388689041137695, -5.94810152053833, -5.507513999938965, -5.066926956176758, -4.626339435577393, -4.185751914978027, -3.745164632797241, -3.304577112197876, -2.86398983001709, -2.4234023094177246, -1.9828150272369385, -1.5422277450561523, -1.101640224456787, -0.661052942276001, -0.22046557068824768, 0.22012180089950562, 0.6607091426849365, 1.1012965440750122, 1.541883945465088, 1.982471227645874, 2.4230587482452393, 2.8636460304260254, 3.3042333126068115, 3.7448208332061768, 4.185408115386963, 4.625995635986328, 5.066582679748535, 5.5071702003479, 5.947757720947266, 6.388344764709473, 6.828932285308838, 7.269519329071045, 7.71010684967041, 8.150693893432617, 8.59128189086914, 9.031868934631348, 9.472455978393555, 9.913043975830078]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 10.0, 16.0, 14.0, 14.0, 25.0, 32.0, 20.0, 23.0, 29.0, 40.0, 28.0, 41.0, 29.0, 43.0, 40.0, 43.0, 41.0, 45.0, 54.0, 35.0, 36.0, 27.0, 34.0, 34.0, 29.0, 38.0, 34.0, 13.0, 21.0, 16.0, 16.0, 14.0, 13.0, 7.0, 8.0, 8.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.650493621826172, -7.420549392700195, -7.190605640411377, -6.9606614112854, -6.730717658996582, -6.5007734298706055, -6.270829200744629, -6.0408854484558105, -5.810941219329834, -5.580996990203857, -5.351053237915039, -5.1211090087890625, -4.891165256500244, -4.661221027374268, -4.431277275085449, -4.201333045959473, -3.971389055252075, -3.7414450645446777, -3.5115010738372803, -3.281557083129883, -3.0516128540039062, -2.821668863296509, -2.5917248725891113, -2.3617806434631348, -2.1318368911743164, -1.901892900466919, -1.671948790550232, -1.4420047998428345, -1.2120606899261475, -0.98211669921875, -0.7521727085113525, -0.5222285985946655, -0.2922844886779785, -0.06234045326709747, 0.16760358214378357, 0.3975476026535034, 0.6274916529655457, 0.8574357032775879, 1.0873796939849854, 1.3173238039016724, 1.5472677946090698, 1.7772117853164673, 2.0071558952331543, 2.2370998859405518, 2.467043876647949, 2.696988105773926, 2.926931858062744, 3.1568760871887207, 3.386820077896118, 3.6167640686035156, 3.846708059310913, 4.0766520500183105, 4.306596279144287, 4.5365400314331055, 4.766484260559082, 4.996428489685059, 5.226372241973877, 5.4563164710998535, 5.686260223388672, 5.916204452514648, 6.146148204803467, 6.376092433929443, 6.606036186218262, 6.835980415344238, 7.065924644470215]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 12.0, 12.0, 14.0, 16.0, 28.0, 38.0, 63.0, 69.0, 115.0, 147.0, 253.0, 374.0, 572.0, 893.0, 1452.0, 2294.0, 3889.0, 6867.0, 12672.0, 23852.0, 46673.0, 92229.0, 166855.0, 233197.0, 202409.0, 120829.0, 63017.0, 31883.0, 16504.0, 8776.0, 4888.0, 2880.0, 1685.0, 1069.0, 691.0, 404.0, 296.0, 192.0, 154.0, 80.0, 64.0, 31.0, 35.0, 24.0, 14.0, 17.0, 5.0, 4.0, 8.0, 2.0, 1.0, 5.0], "bins": [-2.94921875, -2.86663818359375, -2.7840576171875, -2.70147705078125, -2.618896484375, -2.53631591796875, -2.4537353515625, -2.37115478515625, -2.28857421875, -2.20599365234375, -2.1234130859375, -2.04083251953125, -1.958251953125, -1.87567138671875, -1.7930908203125, -1.71051025390625, -1.6279296875, -1.54534912109375, -1.4627685546875, -1.38018798828125, -1.297607421875, -1.21502685546875, -1.1324462890625, -1.04986572265625, -0.96728515625, -0.88470458984375, -0.8021240234375, -0.71954345703125, -0.636962890625, -0.55438232421875, -0.4718017578125, -0.38922119140625, -0.306640625, -0.22406005859375, -0.1414794921875, -0.05889892578125, 0.023681640625, 0.10626220703125, 0.1888427734375, 0.27142333984375, 0.35400390625, 0.43658447265625, 0.5191650390625, 0.60174560546875, 0.684326171875, 0.76690673828125, 0.8494873046875, 0.93206787109375, 1.0146484375, 1.09722900390625, 1.1798095703125, 1.26239013671875, 1.344970703125, 1.42755126953125, 1.5101318359375, 1.59271240234375, 1.67529296875, 1.75787353515625, 1.8404541015625, 1.92303466796875, 2.005615234375, 2.08819580078125, 2.1707763671875, 2.25335693359375, 2.3359375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 11.0, 8.0, 6.0, 10.0, 25.0, 16.0, 21.0, 34.0, 25.0, 33.0, 40.0, 33.0, 55.0, 48.0, 44.0, 50.0, 47.0, 51.0, 49.0, 37.0, 50.0, 40.0, 44.0, 39.0, 39.0, 27.0, 25.0, 20.0, 16.0, 13.0, 9.0, 12.0, 8.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.037109375, -1.0096511840820312, -0.9821929931640625, -0.9547348022460938, -0.927276611328125, -0.8998184204101562, -0.8723602294921875, -0.8449020385742188, -0.81744384765625, -0.7899856567382812, -0.7625274658203125, -0.7350692749023438, -0.707611083984375, -0.6801528930664062, -0.6526947021484375, -0.6252365112304688, -0.5977783203125, -0.5703201293945312, -0.5428619384765625, -0.5154037475585938, -0.487945556640625, -0.46048736572265625, -0.4330291748046875, -0.40557098388671875, -0.37811279296875, -0.35065460205078125, -0.3231964111328125, -0.29573822021484375, -0.268280029296875, -0.24082183837890625, -0.2133636474609375, -0.18590545654296875, -0.158447265625, -0.13098907470703125, -0.1035308837890625, -0.07607269287109375, -0.048614501953125, -0.02115631103515625, 0.0063018798828125, 0.03376007080078125, 0.06121826171875, 0.08867645263671875, 0.1161346435546875, 0.14359283447265625, 0.171051025390625, 0.19850921630859375, 0.2259674072265625, 0.25342559814453125, 0.2808837890625, 0.30834197998046875, 0.3358001708984375, 0.36325836181640625, 0.390716552734375, 0.41817474365234375, 0.4456329345703125, 0.47309112548828125, 0.50054931640625, 0.5280075073242188, 0.5554656982421875, 0.5829238891601562, 0.610382080078125, 0.6378402709960938, 0.6652984619140625, 0.6927566528320312, 0.72021484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 11.0, 25.0, 21.0, 28.0, 38.0, 51.0, 62.0, 99.0, 157.0, 216.0, 276.0, 421.0, 638.0, 1212.0, 3435.0, 16036.0, 115001.0, 605115.0, 261858.0, 33715.0, 5958.0, 1748.0, 821.0, 509.0, 312.0, 209.0, 175.0, 108.0, 81.0, 58.0, 42.0, 34.0, 23.0, 16.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.5703125, -6.363037109375, -6.15576171875, -5.948486328125, -5.7412109375, -5.533935546875, -5.32666015625, -5.119384765625, -4.912109375, -4.704833984375, -4.49755859375, -4.290283203125, -4.0830078125, -3.875732421875, -3.66845703125, -3.461181640625, -3.25390625, -3.046630859375, -2.83935546875, -2.632080078125, -2.4248046875, -2.217529296875, -2.01025390625, -1.802978515625, -1.595703125, -1.388427734375, -1.18115234375, -0.973876953125, -0.7666015625, -0.559326171875, -0.35205078125, -0.144775390625, 0.0625, 0.269775390625, 0.47705078125, 0.684326171875, 0.8916015625, 1.098876953125, 1.30615234375, 1.513427734375, 1.720703125, 1.927978515625, 2.13525390625, 2.342529296875, 2.5498046875, 2.757080078125, 2.96435546875, 3.171630859375, 3.37890625, 3.586181640625, 3.79345703125, 4.000732421875, 4.2080078125, 4.415283203125, 4.62255859375, 4.829833984375, 5.037109375, 5.244384765625, 5.45166015625, 5.658935546875, 5.8662109375, 6.073486328125, 6.28076171875, 6.488037109375, 6.6953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 3.0, 8.0, 4.0, 5.0, 10.0, 9.0, 16.0, 21.0, 14.0, 9.0, 30.0, 22.0, 30.0, 33.0, 36.0, 47.0, 35.0, 35.0, 48.0, 40.0, 52.0, 39.0, 54.0, 51.0, 38.0, 34.0, 47.0, 34.0, 32.0, 25.0, 26.0, 31.0, 11.0, 8.0, 18.0, 9.0, 14.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.515625, -3.399932861328125, -3.28424072265625, -3.168548583984375, -3.0528564453125, -2.937164306640625, -2.82147216796875, -2.705780029296875, -2.590087890625, -2.474395751953125, -2.35870361328125, -2.243011474609375, -2.1273193359375, -2.011627197265625, -1.89593505859375, -1.780242919921875, -1.66455078125, -1.548858642578125, -1.43316650390625, -1.317474365234375, -1.2017822265625, -1.086090087890625, -0.97039794921875, -0.854705810546875, -0.739013671875, -0.623321533203125, -0.50762939453125, -0.391937255859375, -0.2762451171875, -0.160552978515625, -0.04486083984375, 0.070831298828125, 0.1865234375, 0.302215576171875, 0.41790771484375, 0.533599853515625, 0.6492919921875, 0.764984130859375, 0.88067626953125, 0.996368408203125, 1.112060546875, 1.227752685546875, 1.34344482421875, 1.459136962890625, 1.5748291015625, 1.690521240234375, 1.80621337890625, 1.921905517578125, 2.03759765625, 2.153289794921875, 2.26898193359375, 2.384674072265625, 2.5003662109375, 2.616058349609375, 2.73175048828125, 2.847442626953125, 2.963134765625, 3.078826904296875, 3.19451904296875, 3.310211181640625, 3.4259033203125, 3.541595458984375, 3.65728759765625, 3.772979736328125, 3.888671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 11.0, 16.0, 26.0, 33.0, 40.0, 91.0, 138.0, 245.0, 524.0, 1373.0, 4625.0, 19471.0, 103487.0, 440109.0, 375860.0, 80921.0, 15568.0, 3653.0, 1248.0, 479.0, 269.0, 125.0, 73.0, 51.0, 29.0, 18.0, 8.0, 11.0, 9.0, 9.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5, -2.424072265625, -2.34814453125, -2.272216796875, -2.1962890625, -2.120361328125, -2.04443359375, -1.968505859375, -1.892578125, -1.816650390625, -1.74072265625, -1.664794921875, -1.5888671875, -1.512939453125, -1.43701171875, -1.361083984375, -1.28515625, -1.209228515625, -1.13330078125, -1.057373046875, -0.9814453125, -0.905517578125, -0.82958984375, -0.753662109375, -0.677734375, -0.601806640625, -0.52587890625, -0.449951171875, -0.3740234375, -0.298095703125, -0.22216796875, -0.146240234375, -0.0703125, 0.005615234375, 0.08154296875, 0.157470703125, 0.2333984375, 0.309326171875, 0.38525390625, 0.461181640625, 0.537109375, 0.613037109375, 0.68896484375, 0.764892578125, 0.8408203125, 0.916748046875, 0.99267578125, 1.068603515625, 1.14453125, 1.220458984375, 1.29638671875, 1.372314453125, 1.4482421875, 1.524169921875, 1.60009765625, 1.676025390625, 1.751953125, 1.827880859375, 1.90380859375, 1.979736328125, 2.0556640625, 2.131591796875, 2.20751953125, 2.283447265625, 2.359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 8.0, 8.0, 7.0, 8.0, 8.0, 8.0, 14.0, 22.0, 37.0, 33.0, 31.0, 45.0, 48.0, 54.0, 44.0, 79.0, 75.0, 62.0, 66.0, 44.0, 43.0, 37.0, 42.0, 27.0, 14.0, 22.0, 23.0, 14.0, 22.0, 8.0, 12.0, 6.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002522468566894531, -0.0002439543604850769, -0.00023566186428070068, -0.00022736936807632446, -0.00021907687187194824, -0.00021078437566757202, -0.0002024918794631958, -0.00019419938325881958, -0.00018590688705444336, -0.00017761439085006714, -0.00016932189464569092, -0.0001610293984413147, -0.00015273690223693848, -0.00014444440603256226, -0.00013615190982818604, -0.00012785941362380981, -0.0001195669174194336, -0.00011127442121505737, -0.00010298192501068115, -9.468942880630493e-05, -8.639693260192871e-05, -7.810443639755249e-05, -6.981194019317627e-05, -6.151944398880005e-05, -5.322694778442383e-05, -4.493445158004761e-05, -3.664195537567139e-05, -2.8349459171295166e-05, -2.0056962966918945e-05, -1.1764466762542725e-05, -3.471970558166504e-06, 4.820525646209717e-06, 1.3113021850585938e-05, 2.1405518054962158e-05, 2.969801425933838e-05, 3.79905104637146e-05, 4.628300666809082e-05, 5.457550287246704e-05, 6.286799907684326e-05, 7.116049528121948e-05, 7.94529914855957e-05, 8.774548768997192e-05, 9.603798389434814e-05, 0.00010433048009872437, 0.00011262297630310059, 0.0001209154725074768, 0.00012920796871185303, 0.00013750046491622925, 0.00014579296112060547, 0.0001540854573249817, 0.0001623779535293579, 0.00017067044973373413, 0.00017896294593811035, 0.00018725544214248657, 0.0001955479383468628, 0.00020384043455123901, 0.00021213293075561523, 0.00022042542695999146, 0.00022871792316436768, 0.0002370104193687439, 0.0002453029155731201, 0.00025359541177749634, 0.00026188790798187256, 0.0002701804041862488, 0.000278472900390625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 3.0, 8.0, 13.0, 24.0, 25.0, 38.0, 58.0, 89.0, 132.0, 198.0, 318.0, 605.0, 1206.0, 3050.0, 12633.0, 90787.0, 499662.0, 370947.0, 55511.0, 8559.0, 2289.0, 1010.0, 532.0, 315.0, 182.0, 113.0, 78.0, 52.0, 33.0, 22.0, 13.0, 9.0, 8.0, 1.0, 7.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.85546875, -2.765899658203125, -2.67633056640625, -2.586761474609375, -2.4971923828125, -2.407623291015625, -2.31805419921875, -2.228485107421875, -2.138916015625, -2.049346923828125, -1.95977783203125, -1.870208740234375, -1.7806396484375, -1.691070556640625, -1.60150146484375, -1.511932373046875, -1.42236328125, -1.332794189453125, -1.24322509765625, -1.153656005859375, -1.0640869140625, -0.974517822265625, -0.88494873046875, -0.795379638671875, -0.705810546875, -0.616241455078125, -0.52667236328125, -0.437103271484375, -0.3475341796875, -0.257965087890625, -0.16839599609375, -0.078826904296875, 0.0107421875, 0.100311279296875, 0.18988037109375, 0.279449462890625, 0.3690185546875, 0.458587646484375, 0.54815673828125, 0.637725830078125, 0.727294921875, 0.816864013671875, 0.90643310546875, 0.996002197265625, 1.0855712890625, 1.175140380859375, 1.26470947265625, 1.354278564453125, 1.44384765625, 1.533416748046875, 1.62298583984375, 1.712554931640625, 1.8021240234375, 1.891693115234375, 1.98126220703125, 2.070831298828125, 2.160400390625, 2.249969482421875, 2.33953857421875, 2.429107666015625, 2.5186767578125, 2.608245849609375, 2.69781494140625, 2.787384033203125, 2.876953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 10.0, 16.0, 20.0, 29.0, 34.0, 44.0, 65.0, 45.0, 66.0, 92.0, 95.0, 87.0, 75.0, 65.0, 63.0, 40.0, 39.0, 30.0, 24.0, 20.0, 12.0, 13.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3994140625, -1.3372344970703125, -1.275054931640625, -1.2128753662109375, -1.15069580078125, -1.0885162353515625, -1.026336669921875, -0.9641571044921875, -0.9019775390625, -0.8397979736328125, -0.777618408203125, -0.7154388427734375, -0.65325927734375, -0.5910797119140625, -0.528900146484375, -0.4667205810546875, -0.404541015625, -0.3423614501953125, -0.280181884765625, -0.2180023193359375, -0.15582275390625, -0.0936431884765625, -0.031463623046875, 0.0307159423828125, 0.0928955078125, 0.1550750732421875, 0.217254638671875, 0.2794342041015625, 0.34161376953125, 0.4037933349609375, 0.465972900390625, 0.5281524658203125, 0.59033203125, 0.6525115966796875, 0.714691162109375, 0.7768707275390625, 0.83905029296875, 0.9012298583984375, 0.963409423828125, 1.0255889892578125, 1.0877685546875, 1.1499481201171875, 1.212127685546875, 1.2743072509765625, 1.33648681640625, 1.3986663818359375, 1.460845947265625, 1.5230255126953125, 1.585205078125, 1.6473846435546875, 1.709564208984375, 1.7717437744140625, 1.83392333984375, 1.8961029052734375, 1.958282470703125, 2.0204620361328125, 2.0826416015625, 2.1448211669921875, 2.207000732421875, 2.2691802978515625, 2.33135986328125, 2.3935394287109375, 2.455718994140625, 2.5178985595703125, 2.580078125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 12.0, 21.0, 46.0, 85.0, 165.0, 219.0, 206.0, 144.0, 58.0, 31.0, 16.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.44492721557617, -60.64997482299805, -58.855018615722656, -57.06006622314453, -55.26511001586914, -53.470157623291016, -51.675201416015625, -49.8802490234375, -48.085296630859375, -46.29034423828125, -44.49538803100586, -42.700435638427734, -40.905479431152344, -39.11052703857422, -37.315574645996094, -35.5206184387207, -33.72566223144531, -31.930707931518555, -30.135753631591797, -28.340801239013672, -26.54584503173828, -24.750892639160156, -22.9559383392334, -21.16098403930664, -19.366029739379883, -17.571075439453125, -15.776121139526367, -13.981167793273926, -12.186213493347168, -10.39125919342041, -8.596305847167969, -6.801351547241211, -5.006401062011719, -3.21144700050354, -1.4164929389953613, 0.3784608840942383, 2.173415184020996, 3.968369483947754, 5.763322830200195, 7.558277130126953, 9.353231430053711, 11.148185729980469, 12.943140029907227, 14.738093376159668, 16.53304672241211, 18.3280029296875, 20.122955322265625, 21.917909622192383, 23.71286392211914, 25.5078182220459, 27.302772521972656, 29.09772491455078, 30.892681121826172, 32.6876335144043, 34.48258972167969, 36.27754211425781, 38.07249450683594, 39.86744689941406, 41.66240310668945, 43.45735549926758, 45.25231170654297, 47.047264099121094, 48.84221649169922, 50.63717269897461, 52.43212890625]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 2.0, 9.0, 5.0, 12.0, 11.0, 10.0, 17.0, 14.0, 27.0, 25.0, 18.0, 18.0, 40.0, 43.0, 41.0, 39.0, 36.0, 43.0, 41.0, 40.0, 39.0, 45.0, 40.0, 38.0, 51.0, 39.0, 34.0, 32.0, 20.0, 32.0, 27.0, 20.0, 11.0, 18.0, 14.0, 8.0, 7.0, 14.0, 7.0, 6.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.701343536376953, -16.108783721923828, -15.516223907470703, -14.923663139343262, -14.331103324890137, -13.738543510437012, -13.14598274230957, -12.553422927856445, -11.96086311340332, -11.368303298950195, -10.77574348449707, -10.183182716369629, -9.590622901916504, -8.998063087463379, -8.405502319335938, -7.8129425048828125, -7.2203826904296875, -6.6278228759765625, -6.035262584686279, -5.442702293395996, -4.850142478942871, -4.257582664489746, -3.665022373199463, -3.0724620819091797, -2.4799022674560547, -1.8873422145843506, -1.2947821617126465, -0.7022221088409424, -0.10966205596923828, 0.4828979969024658, 1.07545804977417, 1.6680183410644531, 2.260580062866211, 2.853140115737915, 3.445700168609619, 4.038260459899902, 4.630820274353027, 5.223380088806152, 5.8159403800964355, 6.408500671386719, 7.001060485839844, 7.593620300292969, 8.186180114746094, 8.778740882873535, 9.37130069732666, 9.963860511779785, 10.556421279907227, 11.148981094360352, 11.741540908813477, 12.334100723266602, 12.926660537719727, 13.519221305847168, 14.111781120300293, 14.704340934753418, 15.29690170288086, 15.889461517333984, 16.48202133178711, 17.074581146240234, 17.66714096069336, 18.259700775146484, 18.85226058959961, 19.444822311401367, 20.037382125854492, 20.629941940307617, 21.222501754760742]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 6.0, 5.0, 7.0, 18.0, 29.0, 34.0, 50.0, 79.0, 120.0, 154.0, 232.0, 327.0, 595.0, 1151.0, 2432.0, 7658.0, 56968.0, 4056076.0, 55495.0, 7590.0, 2500.0, 1086.0, 606.0, 324.0, 228.0, 153.0, 97.0, 70.0, 50.0, 41.0, 21.0, 13.0, 14.0, 13.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -13.112060546875, -12.73193359375, -12.351806640625, -11.9716796875, -11.591552734375, -11.21142578125, -10.831298828125, -10.451171875, -10.071044921875, -9.69091796875, -9.310791015625, -8.9306640625, -8.550537109375, -8.17041015625, -7.790283203125, -7.41015625, -7.030029296875, -6.64990234375, -6.269775390625, -5.8896484375, -5.509521484375, -5.12939453125, -4.749267578125, -4.369140625, -3.989013671875, -3.60888671875, -3.228759765625, -2.8486328125, -2.468505859375, -2.08837890625, -1.708251953125, -1.328125, -0.947998046875, -0.56787109375, -0.187744140625, 0.1923828125, 0.572509765625, 0.95263671875, 1.332763671875, 1.712890625, 2.093017578125, 2.47314453125, 2.853271484375, 3.2333984375, 3.613525390625, 3.99365234375, 4.373779296875, 4.75390625, 5.134033203125, 5.51416015625, 5.894287109375, 6.2744140625, 6.654541015625, 7.03466796875, 7.414794921875, 7.794921875, 8.175048828125, 8.55517578125, 8.935302734375, 9.3154296875, 9.695556640625, 10.07568359375, 10.455810546875, 10.8359375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 9.0, 15.0, 13.0, 18.0, 28.0, 31.0, 39.0, 39.0, 40.0, 53.0, 52.0, 52.0, 48.0, 64.0, 54.0, 53.0, 58.0, 59.0, 46.0, 39.0, 36.0, 31.0, 25.0, 19.0, 22.0, 12.0, 6.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1056976318359375, -1.072723388671875, -1.0397491455078125, -1.00677490234375, -0.9738006591796875, -0.940826416015625, -0.9078521728515625, -0.8748779296875, -0.8419036865234375, -0.808929443359375, -0.7759552001953125, -0.74298095703125, -0.7100067138671875, -0.677032470703125, -0.6440582275390625, -0.611083984375, -0.5781097412109375, -0.545135498046875, -0.5121612548828125, -0.47918701171875, -0.4462127685546875, -0.413238525390625, -0.3802642822265625, -0.3472900390625, -0.3143157958984375, -0.281341552734375, -0.2483673095703125, -0.21539306640625, -0.1824188232421875, -0.149444580078125, -0.1164703369140625, -0.08349609375, -0.0505218505859375, -0.017547607421875, 0.0154266357421875, 0.04840087890625, 0.0813751220703125, 0.114349365234375, 0.1473236083984375, 0.1802978515625, 0.2132720947265625, 0.246246337890625, 0.2792205810546875, 0.31219482421875, 0.3451690673828125, 0.378143310546875, 0.4111175537109375, 0.444091796875, 0.4770660400390625, 0.510040283203125, 0.5430145263671875, 0.57598876953125, 0.6089630126953125, 0.641937255859375, 0.6749114990234375, 0.7078857421875, 0.7408599853515625, 0.773834228515625, 0.8068084716796875, 0.83978271484375, 0.8727569580078125, 0.905731201171875, 0.9387054443359375, 0.9716796875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 7.0, 11.0, 6.0, 7.0, 19.0, 12.0, 22.0, 36.0, 52.0, 97.0, 108.0, 148.0, 199.0, 319.0, 475.0, 671.0, 947.0, 1582.0, 2391.0, 4012.0, 7718.0, 16817.0, 48571.0, 310606.0, 3637294.0, 108453.0, 28110.0, 11180.0, 5499.0, 3089.0, 1892.0, 1243.0, 824.0, 533.0, 370.0, 310.0, 200.0, 134.0, 87.0, 70.0, 48.0, 39.0, 27.0, 18.0, 16.0, 10.0, 5.0, 1.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.44921875, -3.33135986328125, -3.2135009765625, -3.09564208984375, -2.977783203125, -2.85992431640625, -2.7420654296875, -2.62420654296875, -2.50634765625, -2.38848876953125, -2.2706298828125, -2.15277099609375, -2.034912109375, -1.91705322265625, -1.7991943359375, -1.68133544921875, -1.5634765625, -1.44561767578125, -1.3277587890625, -1.20989990234375, -1.092041015625, -0.97418212890625, -0.8563232421875, -0.73846435546875, -0.62060546875, -0.50274658203125, -0.3848876953125, -0.26702880859375, -0.149169921875, -0.03131103515625, 0.0865478515625, 0.20440673828125, 0.322265625, 0.44012451171875, 0.5579833984375, 0.67584228515625, 0.793701171875, 0.91156005859375, 1.0294189453125, 1.14727783203125, 1.26513671875, 1.38299560546875, 1.5008544921875, 1.61871337890625, 1.736572265625, 1.85443115234375, 1.9722900390625, 2.09014892578125, 2.2080078125, 2.32586669921875, 2.4437255859375, 2.56158447265625, 2.679443359375, 2.79730224609375, 2.9151611328125, 3.03302001953125, 3.15087890625, 3.26873779296875, 3.3865966796875, 3.50445556640625, 3.622314453125, 3.74017333984375, 3.8580322265625, 3.97589111328125, 4.09375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 3.0, 4.0, 5.0, 17.0, 20.0, 33.0, 48.0, 82.0, 204.0, 2525.0, 761.0, 173.0, 66.0, 41.0, 25.0, 8.0, 11.0, 7.0, 6.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0282745361328125, -0.995025634765625, -0.9617767333984375, -0.92852783203125, -0.8952789306640625, -0.862030029296875, -0.8287811279296875, -0.7955322265625, -0.7622833251953125, -0.729034423828125, -0.6957855224609375, -0.66253662109375, -0.6292877197265625, -0.596038818359375, -0.5627899169921875, -0.529541015625, -0.4962921142578125, -0.463043212890625, -0.4297943115234375, -0.39654541015625, -0.3632965087890625, -0.330047607421875, -0.2967987060546875, -0.2635498046875, -0.2303009033203125, -0.197052001953125, -0.1638031005859375, -0.13055419921875, -0.0973052978515625, -0.064056396484375, -0.0308074951171875, 0.00244140625, 0.0356903076171875, 0.068939208984375, 0.1021881103515625, 0.13543701171875, 0.1686859130859375, 0.201934814453125, 0.2351837158203125, 0.2684326171875, 0.3016815185546875, 0.334930419921875, 0.3681793212890625, 0.40142822265625, 0.4346771240234375, 0.467926025390625, 0.5011749267578125, 0.534423828125, 0.5676727294921875, 0.600921630859375, 0.6341705322265625, 0.66741943359375, 0.7006683349609375, 0.733917236328125, 0.7671661376953125, 0.8004150390625, 0.8336639404296875, 0.866912841796875, 0.9001617431640625, 0.93341064453125, 0.9666595458984375, 0.999908447265625, 1.0331573486328125, 1.06640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 9.0, 28.0, 24.0, 47.0, 67.0, 82.0, 94.0, 124.0, 116.0, 98.0, 87.0, 72.0, 50.0, 41.0, 24.0, 11.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.908100605010986, -5.762397766113281, -5.616695404052734, -5.470992565155029, -5.325289726257324, -5.179587364196777, -5.033884525299072, -4.888181686401367, -4.74247932434082, -4.596776485443115, -4.451074123382568, -4.305371284484863, -4.159668445587158, -4.013966083526611, -3.8682632446289062, -3.7225606441497803, -3.576857805252075, -3.431155204772949, -3.285452365875244, -3.139749765396118, -2.994047164916992, -2.848344326019287, -2.702641725540161, -2.556939125061035, -2.41123628616333, -2.265533685684204, -2.119830846786499, -1.974128246307373, -1.828425645828247, -1.6827229261398315, -1.537020206451416, -1.39131760597229, -1.2456152439117432, -1.0999125242233276, -0.9542099237442017, -0.8085072040557861, -0.6628045439720154, -0.5171018838882446, -0.3713991641998291, -0.22569656372070312, -0.0799938440322876, 0.06570883095264435, 0.2114115059375763, 0.35711419582366943, 0.5028168559074402, 0.6485195159912109, 0.7942222356796265, 0.9399248361587524, 1.085627555847168, 1.2313302755355835, 1.3770328760147095, 1.522735595703125, 1.668438196182251, 1.8141409158706665, 1.959843635559082, 2.105546236038208, 2.251248836517334, 2.39695143699646, 2.542654275894165, 2.688356876373291, 2.834059476852417, 2.979762077331543, 3.125464916229248, 3.271167516708374, 3.416870355606079]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 9.0, 3.0, 5.0, 9.0, 12.0, 17.0, 15.0, 17.0, 22.0, 22.0, 25.0, 39.0, 31.0, 40.0, 42.0, 31.0, 48.0, 37.0, 42.0, 47.0, 45.0, 39.0, 41.0, 36.0, 33.0, 36.0, 38.0, 28.0, 36.0, 21.0, 20.0, 24.0, 13.0, 23.0, 11.0, 11.0, 5.0, 6.0, 3.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.091492176055908, -2.0252082347869873, -1.9589242935180664, -1.892640233039856, -1.826356291770935, -1.7600723505020142, -1.6937882900238037, -1.6275043487548828, -1.561220407485962, -1.494936466217041, -1.4286525249481201, -1.3623684644699097, -1.2960845232009888, -1.2298005819320679, -1.1635165214538574, -1.0972325801849365, -1.0309486389160156, -0.9646646976470947, -0.898380696773529, -0.8320966958999634, -0.7658127546310425, -0.6995288133621216, -0.6332448124885559, -0.5669608116149902, -0.5006768703460693, -0.43439289927482605, -0.36810892820358276, -0.3018249571323395, -0.2355409860610962, -0.1692570149898529, -0.10297304391860962, -0.03668907284736633, 0.029594898223876953, 0.09587886929512024, 0.16216284036636353, 0.2284468114376068, 0.2947307825088501, 0.3610147535800934, 0.42729872465133667, 0.49358269572257996, 0.5598666667938232, 0.6261506080627441, 0.6924346089363098, 0.7587186098098755, 0.8250025510787964, 0.8912864923477173, 0.957570493221283, 1.0238544940948486, 1.0901384353637695, 1.1564223766326904, 1.2227063179016113, 1.2889903783798218, 1.3552743196487427, 1.4215582609176636, 1.487842321395874, 1.554126262664795, 1.6204102039337158, 1.6866941452026367, 1.7529780864715576, 1.819262146949768, 1.885546088218689, 1.9518300294876099, 2.0181140899658203, 2.084398031234741, 2.150681972503662]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 11.0, 22.0, 20.0, 36.0, 50.0, 56.0, 80.0, 152.0, 196.0, 292.0, 416.0, 614.0, 882.0, 1437.0, 2347.0, 3807.0, 6543.0, 11223.0, 19991.0, 35392.0, 62593.0, 106021.0, 159207.0, 190370.0, 168950.0, 115348.0, 69321.0, 39810.0, 22100.0, 12557.0, 7291.0, 4189.0, 2537.0, 1636.0, 1020.0, 616.0, 443.0, 308.0, 207.0, 123.0, 82.0, 73.0, 45.0, 40.0, 30.0, 23.0, 13.0, 9.0, 5.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0], "bins": [-2.03515625, -1.97271728515625, -1.9102783203125, -1.84783935546875, -1.785400390625, -1.72296142578125, -1.6605224609375, -1.59808349609375, -1.53564453125, -1.47320556640625, -1.4107666015625, -1.34832763671875, -1.285888671875, -1.22344970703125, -1.1610107421875, -1.09857177734375, -1.0361328125, -0.97369384765625, -0.9112548828125, -0.84881591796875, -0.786376953125, -0.72393798828125, -0.6614990234375, -0.59906005859375, -0.53662109375, -0.47418212890625, -0.4117431640625, -0.34930419921875, -0.286865234375, -0.22442626953125, -0.1619873046875, -0.09954833984375, -0.037109375, 0.02532958984375, 0.0877685546875, 0.15020751953125, 0.212646484375, 0.27508544921875, 0.3375244140625, 0.39996337890625, 0.46240234375, 0.52484130859375, 0.5872802734375, 0.64971923828125, 0.712158203125, 0.77459716796875, 0.8370361328125, 0.89947509765625, 0.9619140625, 1.02435302734375, 1.0867919921875, 1.14923095703125, 1.211669921875, 1.27410888671875, 1.3365478515625, 1.39898681640625, 1.46142578125, 1.52386474609375, 1.5863037109375, 1.64874267578125, 1.711181640625, 1.77362060546875, 1.8360595703125, 1.89849853515625, 1.9609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 13.0, 17.0, 12.0, 19.0, 24.0, 36.0, 42.0, 42.0, 44.0, 45.0, 56.0, 49.0, 54.0, 58.0, 52.0, 64.0, 54.0, 68.0, 32.0, 31.0, 25.0, 34.0, 23.0, 20.0, 12.0, 14.0, 10.0, 10.0, 10.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.232421875, -1.1984634399414062, -1.1645050048828125, -1.1305465698242188, -1.096588134765625, -1.0626296997070312, -1.0286712646484375, -0.9947128295898438, -0.96075439453125, -0.9267959594726562, -0.8928375244140625, -0.8588790893554688, -0.824920654296875, -0.7909622192382812, -0.7570037841796875, -0.7230453491210938, -0.6890869140625, -0.6551284790039062, -0.6211700439453125, -0.5872116088867188, -0.553253173828125, -0.5192947387695312, -0.4853363037109375, -0.45137786865234375, -0.41741943359375, -0.38346099853515625, -0.3495025634765625, -0.31554412841796875, -0.281585693359375, -0.24762725830078125, -0.2136688232421875, -0.17971038818359375, -0.145751953125, -0.11179351806640625, -0.0778350830078125, -0.04387664794921875, -0.009918212890625, 0.02404022216796875, 0.0579986572265625, 0.09195709228515625, 0.12591552734375, 0.15987396240234375, 0.1938323974609375, 0.22779083251953125, 0.261749267578125, 0.29570770263671875, 0.3296661376953125, 0.36362457275390625, 0.3975830078125, 0.43154144287109375, 0.4654998779296875, 0.49945831298828125, 0.533416748046875, 0.5673751831054688, 0.6013336181640625, 0.6352920532226562, 0.66925048828125, 0.7032089233398438, 0.7371673583984375, 0.7711257934570312, 0.805084228515625, 0.8390426635742188, 0.8730010986328125, 0.9069595336914062, 0.94091796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 6.0, 4.0, 14.0, 17.0, 31.0, 32.0, 46.0, 57.0, 68.0, 117.0, 128.0, 172.0, 290.0, 351.0, 482.0, 729.0, 1333.0, 3850.0, 23571.0, 215127.0, 659666.0, 122507.0, 13759.0, 2708.0, 1134.0, 681.0, 446.0, 315.0, 223.0, 173.0, 124.0, 91.0, 65.0, 61.0, 51.0, 28.0, 22.0, 22.0, 14.0, 8.0, 9.0, 6.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2265625, -5.0423583984375, -4.858154296875, -4.6739501953125, -4.48974609375, -4.3055419921875, -4.121337890625, -3.9371337890625, -3.7529296875, -3.5687255859375, -3.384521484375, -3.2003173828125, -3.01611328125, -2.8319091796875, -2.647705078125, -2.4635009765625, -2.279296875, -2.0950927734375, -1.910888671875, -1.7266845703125, -1.54248046875, -1.3582763671875, -1.174072265625, -0.9898681640625, -0.8056640625, -0.6214599609375, -0.437255859375, -0.2530517578125, -0.06884765625, 0.1153564453125, 0.299560546875, 0.4837646484375, 0.66796875, 0.8521728515625, 1.036376953125, 1.2205810546875, 1.40478515625, 1.5889892578125, 1.773193359375, 1.9573974609375, 2.1416015625, 2.3258056640625, 2.510009765625, 2.6942138671875, 2.87841796875, 3.0626220703125, 3.246826171875, 3.4310302734375, 3.615234375, 3.7994384765625, 3.983642578125, 4.1678466796875, 4.35205078125, 4.5362548828125, 4.720458984375, 4.9046630859375, 5.0888671875, 5.2730712890625, 5.457275390625, 5.6414794921875, 5.82568359375, 6.0098876953125, 6.194091796875, 6.3782958984375, 6.5625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 8.0, 5.0, 9.0, 9.0, 13.0, 15.0, 12.0, 14.0, 20.0, 21.0, 26.0, 25.0, 34.0, 32.0, 33.0, 32.0, 47.0, 31.0, 42.0, 36.0, 40.0, 38.0, 45.0, 45.0, 50.0, 35.0, 38.0, 27.0, 29.0, 43.0, 24.0, 25.0, 11.0, 13.0, 13.0, 8.0, 14.0, 9.0, 6.0, 5.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.427734375, -3.3203125, -3.212890625, -3.10546875, -2.998046875, -2.890625, -2.783203125, -2.67578125, -2.568359375, -2.4609375, -2.353515625, -2.24609375, -2.138671875, -2.03125, -1.923828125, -1.81640625, -1.708984375, -1.6015625, -1.494140625, -1.38671875, -1.279296875, -1.171875, -1.064453125, -0.95703125, -0.849609375, -0.7421875, -0.634765625, -0.52734375, -0.419921875, -0.3125, -0.205078125, -0.09765625, 0.009765625, 0.1171875, 0.224609375, 0.33203125, 0.439453125, 0.546875, 0.654296875, 0.76171875, 0.869140625, 0.9765625, 1.083984375, 1.19140625, 1.298828125, 1.40625, 1.513671875, 1.62109375, 1.728515625, 1.8359375, 1.943359375, 2.05078125, 2.158203125, 2.265625, 2.373046875, 2.48046875, 2.587890625, 2.6953125, 2.802734375, 2.91015625, 3.017578125, 3.125, 3.232421875, 3.33984375, 3.447265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 0.0, 6.0, 9.0, 7.0, 14.0, 14.0, 23.0, 28.0, 33.0, 63.0, 78.0, 148.0, 249.0, 484.0, 935.0, 2139.0, 6184.0, 23619.0, 109645.0, 469940.0, 339800.0, 71344.0, 15750.0, 4578.0, 1649.0, 767.0, 431.0, 205.0, 132.0, 84.0, 51.0, 39.0, 20.0, 17.0, 9.0, 16.0, 9.0, 15.0, 6.0, 5.0, 1.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.11328125, -2.046966552734375, -1.98065185546875, -1.914337158203125, -1.8480224609375, -1.781707763671875, -1.71539306640625, -1.649078369140625, -1.582763671875, -1.516448974609375, -1.45013427734375, -1.383819580078125, -1.3175048828125, -1.251190185546875, -1.18487548828125, -1.118560791015625, -1.05224609375, -0.985931396484375, -0.91961669921875, -0.853302001953125, -0.7869873046875, -0.720672607421875, -0.65435791015625, -0.588043212890625, -0.521728515625, -0.455413818359375, -0.38909912109375, -0.322784423828125, -0.2564697265625, -0.190155029296875, -0.12384033203125, -0.057525634765625, 0.0087890625, 0.075103759765625, 0.14141845703125, 0.207733154296875, 0.2740478515625, 0.340362548828125, 0.40667724609375, 0.472991943359375, 0.539306640625, 0.605621337890625, 0.67193603515625, 0.738250732421875, 0.8045654296875, 0.870880126953125, 0.93719482421875, 1.003509521484375, 1.06982421875, 1.136138916015625, 1.20245361328125, 1.268768310546875, 1.3350830078125, 1.401397705078125, 1.46771240234375, 1.534027099609375, 1.600341796875, 1.666656494140625, 1.73297119140625, 1.799285888671875, 1.8656005859375, 1.931915283203125, 1.99822998046875, 2.064544677734375, 2.130859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 9.0, 5.0, 13.0, 10.0, 20.0, 18.0, 16.0, 29.0, 32.0, 48.0, 52.0, 67.0, 68.0, 97.0, 76.0, 64.0, 70.0, 58.0, 51.0, 42.0, 28.0, 32.0, 15.0, 26.0, 8.0, 11.0, 10.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024330615997314453, -0.00023430772125720978, -0.00022530928254127502, -0.00021631084382534027, -0.00020731240510940552, -0.00019831396639347076, -0.000189315527677536, -0.00018031708896160126, -0.0001713186502456665, -0.00016232021152973175, -0.000153321772813797, -0.00014432333409786224, -0.0001353248953819275, -0.00012632645666599274, -0.00011732801795005798, -0.00010832957923412323, -9.933114051818848e-05, -9.033270180225372e-05, -8.133426308631897e-05, -7.233582437038422e-05, -6.333738565444946e-05, -5.433894693851471e-05, -4.5340508222579956e-05, -3.63420695066452e-05, -2.734363079071045e-05, -1.8345192074775696e-05, -9.346753358840942e-06, -3.4831464290618896e-07, 8.650124073028564e-06, 1.7648562788963318e-05, 2.664700150489807e-05, 3.5645440220832825e-05, 4.464387893676758e-05, 5.364231765270233e-05, 6.264075636863708e-05, 7.163919508457184e-05, 8.063763380050659e-05, 8.963607251644135e-05, 9.86345112323761e-05, 0.00010763294994831085, 0.0001166313886642456, 0.00012562982738018036, 0.0001346282660961151, 0.00014362670481204987, 0.00015262514352798462, 0.00016162358224391937, 0.00017062202095985413, 0.00017962045967578888, 0.00018861889839172363, 0.00019761733710765839, 0.00020661577582359314, 0.0002156142145395279, 0.00022461265325546265, 0.0002336110919713974, 0.00024260953068733215, 0.0002516079694032669, 0.00026060640811920166, 0.0002696048468351364, 0.00027860328555107117, 0.0002876017242670059, 0.0002966001629829407, 0.00030559860169887543, 0.0003145970404148102, 0.00032359547913074493, 0.0003325939178466797]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 3.0, 7.0, 2.0, 11.0, 9.0, 16.0, 32.0, 46.0, 55.0, 109.0, 128.0, 213.0, 373.0, 690.0, 1421.0, 3668.0, 14514.0, 108972.0, 640992.0, 239670.0, 27998.0, 5651.0, 1909.0, 917.0, 463.0, 231.0, 140.0, 90.0, 64.0, 49.0, 32.0, 26.0, 12.0, 12.0, 9.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.87890625, -2.78802490234375, -2.6971435546875, -2.60626220703125, -2.515380859375, -2.42449951171875, -2.3336181640625, -2.24273681640625, -2.15185546875, -2.06097412109375, -1.9700927734375, -1.87921142578125, -1.788330078125, -1.69744873046875, -1.6065673828125, -1.51568603515625, -1.4248046875, -1.33392333984375, -1.2430419921875, -1.15216064453125, -1.061279296875, -0.97039794921875, -0.8795166015625, -0.78863525390625, -0.69775390625, -0.60687255859375, -0.5159912109375, -0.42510986328125, -0.334228515625, -0.24334716796875, -0.1524658203125, -0.06158447265625, 0.029296875, 0.12017822265625, 0.2110595703125, 0.30194091796875, 0.392822265625, 0.48370361328125, 0.5745849609375, 0.66546630859375, 0.75634765625, 0.84722900390625, 0.9381103515625, 1.02899169921875, 1.119873046875, 1.21075439453125, 1.3016357421875, 1.39251708984375, 1.4833984375, 1.57427978515625, 1.6651611328125, 1.75604248046875, 1.846923828125, 1.93780517578125, 2.0286865234375, 2.11956787109375, 2.21044921875, 2.30133056640625, 2.3922119140625, 2.48309326171875, 2.573974609375, 2.66485595703125, 2.7557373046875, 2.84661865234375, 2.9375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 12.0, 10.0, 21.0, 26.0, 28.0, 42.0, 42.0, 54.0, 94.0, 89.0, 83.0, 91.0, 80.0, 66.0, 72.0, 39.0, 45.0, 30.0, 21.0, 15.0, 9.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.955474853515625, -1.88555908203125, -1.815643310546875, -1.7457275390625, -1.675811767578125, -1.60589599609375, -1.535980224609375, -1.466064453125, -1.396148681640625, -1.32623291015625, -1.256317138671875, -1.1864013671875, -1.116485595703125, -1.04656982421875, -0.976654052734375, -0.90673828125, -0.836822509765625, -0.76690673828125, -0.696990966796875, -0.6270751953125, -0.557159423828125, -0.48724365234375, -0.417327880859375, -0.347412109375, -0.277496337890625, -0.20758056640625, -0.137664794921875, -0.0677490234375, 0.002166748046875, 0.07208251953125, 0.141998291015625, 0.2119140625, 0.281829833984375, 0.35174560546875, 0.421661376953125, 0.4915771484375, 0.561492919921875, 0.63140869140625, 0.701324462890625, 0.771240234375, 0.841156005859375, 0.91107177734375, 0.980987548828125, 1.0509033203125, 1.120819091796875, 1.19073486328125, 1.260650634765625, 1.33056640625, 1.400482177734375, 1.47039794921875, 1.540313720703125, 1.6102294921875, 1.680145263671875, 1.75006103515625, 1.819976806640625, 1.889892578125, 1.959808349609375, 2.02972412109375, 2.099639892578125, 2.1695556640625, 2.239471435546875, 2.30938720703125, 2.379302978515625, 2.44921875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 15.0, 24.0, 69.0, 109.0, 187.0, 231.0, 155.0, 103.0, 59.0, 33.0, 9.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.95857238769531, -39.29039764404297, -37.62221908569336, -35.95404052734375, -34.285865783691406, -32.61769104003906, -30.949512481689453, -29.281335830688477, -27.6131591796875, -25.944982528686523, -24.276805877685547, -22.60862922668457, -20.940452575683594, -19.272275924682617, -17.60409927368164, -15.935922622680664, -14.267745971679688, -12.599569320678711, -10.931392669677734, -9.263216018676758, -7.595039367675781, -5.926862716674805, -4.258686065673828, -2.5905094146728516, -0.922332763671875, 0.7458438873291016, 2.414020538330078, 4.082197189331055, 5.750373840332031, 7.418550491333008, 9.086727142333984, 10.754903793334961, 12.423080444335938, 14.091257095336914, 15.75943374633789, 17.427610397338867, 19.095787048339844, 20.76396369934082, 22.432140350341797, 24.100317001342773, 25.76849365234375, 27.436670303344727, 29.104846954345703, 30.77302360534668, 32.441200256347656, 34.109375, 35.77755355834961, 37.44573211669922, 39.11390686035156, 40.782081604003906, 42.450260162353516, 44.118438720703125, 45.78661346435547, 47.45478820800781, 49.12296676635742, 50.79114532470703, 52.459320068359375, 54.12749481201172, 55.79567337036133, 57.46385192871094, 59.13202667236328, 60.800201416015625, 62.468379974365234, 64.13655853271484, 65.80473327636719]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 18.0, 9.0, 9.0, 19.0, 20.0, 18.0, 30.0, 25.0, 27.0, 47.0, 24.0, 39.0, 51.0, 48.0, 52.0, 45.0, 52.0, 51.0, 44.0, 45.0, 40.0, 37.0, 37.0, 34.0, 30.0, 23.0, 18.0, 20.0, 14.0, 18.0, 9.0, 9.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.52798843383789, -22.886945724487305, -22.24590301513672, -21.604860305786133, -20.963817596435547, -20.322772979736328, -19.681730270385742, -19.040687561035156, -18.39964485168457, -17.758602142333984, -17.1175594329834, -16.476516723632812, -15.83547306060791, -15.194430351257324, -14.553386688232422, -13.912343978881836, -13.27130126953125, -12.630258560180664, -11.989215850830078, -11.348172187805176, -10.70712947845459, -10.066086769104004, -9.425043106079102, -8.784000396728516, -8.14295768737793, -7.501914978027344, -6.8608717918396, -6.2198286056518555, -5.5787858963012695, -4.937743186950684, -4.2967000007629395, -3.6556568145751953, -3.0146141052246094, -2.3735711574554443, -1.7325282096862793, -1.0914852619171143, -0.4504423141479492, 0.19060063362121582, 0.8316435813903809, 1.472686767578125, 2.113729476928711, 2.754772424697876, 3.395815372467041, 4.036858558654785, 4.677901268005371, 5.318943977355957, 5.959987163543701, 6.601030349731445, 7.242073059082031, 7.883115768432617, 8.524158477783203, 9.165202140808105, 9.806244850158691, 10.447287559509277, 11.08833122253418, 11.729373931884766, 12.370416641235352, 13.011459350585938, 13.652502059936523, 14.293545722961426, 14.934588432312012, 15.575631141662598, 16.2166748046875, 16.857717514038086, 17.498760223388672]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 6.0, 12.0, 11.0, 7.0, 11.0, 26.0, 46.0, 53.0, 101.0, 165.0, 230.0, 387.0, 813.0, 1509.0, 3364.0, 10120.0, 53889.0, 3962686.0, 134930.0, 16948.0, 4787.0, 1951.0, 910.0, 528.0, 303.0, 166.0, 97.0, 70.0, 54.0, 36.0, 26.0, 9.0, 8.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3984375, -8.13330078125, -7.8681640625, -7.60302734375, -7.337890625, -7.07275390625, -6.8076171875, -6.54248046875, -6.27734375, -6.01220703125, -5.7470703125, -5.48193359375, -5.216796875, -4.95166015625, -4.6865234375, -4.42138671875, -4.15625, -3.89111328125, -3.6259765625, -3.36083984375, -3.095703125, -2.83056640625, -2.5654296875, -2.30029296875, -2.03515625, -1.77001953125, -1.5048828125, -1.23974609375, -0.974609375, -0.70947265625, -0.4443359375, -0.17919921875, 0.0859375, 0.35107421875, 0.6162109375, 0.88134765625, 1.146484375, 1.41162109375, 1.6767578125, 1.94189453125, 2.20703125, 2.47216796875, 2.7373046875, 3.00244140625, 3.267578125, 3.53271484375, 3.7978515625, 4.06298828125, 4.328125, 4.59326171875, 4.8583984375, 5.12353515625, 5.388671875, 5.65380859375, 5.9189453125, 6.18408203125, 6.44921875, 6.71435546875, 6.9794921875, 7.24462890625, 7.509765625, 7.77490234375, 8.0400390625, 8.30517578125, 8.5703125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 13.0, 11.0, 10.0, 24.0, 11.0, 26.0, 35.0, 32.0, 33.0, 53.0, 36.0, 50.0, 45.0, 82.0, 50.0, 61.0, 52.0, 58.0, 47.0, 35.0, 46.0, 34.0, 26.0, 26.0, 21.0, 16.0, 19.0, 6.0, 10.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2490234375, -1.2156448364257812, -1.1822662353515625, -1.1488876342773438, -1.115509033203125, -1.0821304321289062, -1.0487518310546875, -1.0153732299804688, -0.98199462890625, -0.9486160278320312, -0.9152374267578125, -0.8818588256835938, -0.848480224609375, -0.8151016235351562, -0.7817230224609375, -0.7483444213867188, -0.7149658203125, -0.6815872192382812, -0.6482086181640625, -0.6148300170898438, -0.581451416015625, -0.5480728149414062, -0.5146942138671875, -0.48131561279296875, -0.44793701171875, -0.41455841064453125, -0.3811798095703125, -0.34780120849609375, -0.314422607421875, -0.28104400634765625, -0.2476654052734375, -0.21428680419921875, -0.180908203125, -0.14752960205078125, -0.1141510009765625, -0.08077239990234375, -0.047393798828125, -0.01401519775390625, 0.0193634033203125, 0.05274200439453125, 0.08612060546875, 0.11949920654296875, 0.1528778076171875, 0.18625640869140625, 0.219635009765625, 0.25301361083984375, 0.2863922119140625, 0.31977081298828125, 0.3531494140625, 0.38652801513671875, 0.4199066162109375, 0.45328521728515625, 0.486663818359375, 0.5200424194335938, 0.5534210205078125, 0.5867996215820312, 0.62017822265625, 0.6535568237304688, 0.6869354248046875, 0.7203140258789062, 0.753692626953125, 0.7870712280273438, 0.8204498291015625, 0.8538284301757812, 0.88720703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 18.0, 21.0, 18.0, 34.0, 39.0, 48.0, 86.0, 114.0, 162.0, 216.0, 357.0, 542.0, 881.0, 1259.0, 2220.0, 3754.0, 7062.0, 14941.0, 40439.0, 186033.0, 3663301.0, 197990.0, 42090.0, 15557.0, 7305.0, 3749.0, 2169.0, 1283.0, 834.0, 563.0, 389.0, 231.0, 161.0, 106.0, 93.0, 58.0, 33.0, 40.0, 18.0, 15.0, 9.0, 13.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.611328125, -3.49298095703125, -3.3746337890625, -3.25628662109375, -3.137939453125, -3.01959228515625, -2.9012451171875, -2.78289794921875, -2.66455078125, -2.54620361328125, -2.4278564453125, -2.30950927734375, -2.191162109375, -2.07281494140625, -1.9544677734375, -1.83612060546875, -1.7177734375, -1.59942626953125, -1.4810791015625, -1.36273193359375, -1.244384765625, -1.12603759765625, -1.0076904296875, -0.88934326171875, -0.77099609375, -0.65264892578125, -0.5343017578125, -0.41595458984375, -0.297607421875, -0.17926025390625, -0.0609130859375, 0.05743408203125, 0.17578125, 0.29412841796875, 0.4124755859375, 0.53082275390625, 0.649169921875, 0.76751708984375, 0.8858642578125, 1.00421142578125, 1.12255859375, 1.24090576171875, 1.3592529296875, 1.47760009765625, 1.595947265625, 1.71429443359375, 1.8326416015625, 1.95098876953125, 2.0693359375, 2.18768310546875, 2.3060302734375, 2.42437744140625, 2.542724609375, 2.66107177734375, 2.7794189453125, 2.89776611328125, 3.01611328125, 3.13446044921875, 3.2528076171875, 3.37115478515625, 3.489501953125, 3.60784912109375, 3.7261962890625, 3.84454345703125, 3.962890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 12.0, 13.0, 21.0, 29.0, 43.0, 53.0, 110.0, 273.0, 2450.0, 592.0, 186.0, 92.0, 52.0, 36.0, 24.0, 12.0, 11.0, 9.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9242630004882812, -0.8910064697265625, -0.8577499389648438, -0.824493408203125, -0.7912368774414062, -0.7579803466796875, -0.7247238159179688, -0.69146728515625, -0.6582107543945312, -0.6249542236328125, -0.5916976928710938, -0.558441162109375, -0.5251846313476562, -0.4919281005859375, -0.45867156982421875, -0.4254150390625, -0.39215850830078125, -0.3589019775390625, -0.32564544677734375, -0.292388916015625, -0.25913238525390625, -0.2258758544921875, -0.19261932373046875, -0.15936279296875, -0.12610626220703125, -0.0928497314453125, -0.05959320068359375, -0.026336669921875, 0.00691986083984375, 0.0401763916015625, 0.07343292236328125, 0.106689453125, 0.13994598388671875, 0.1732025146484375, 0.20645904541015625, 0.239715576171875, 0.27297210693359375, 0.3062286376953125, 0.33948516845703125, 0.37274169921875, 0.40599822998046875, 0.4392547607421875, 0.47251129150390625, 0.505767822265625, 0.5390243530273438, 0.5722808837890625, 0.6055374145507812, 0.6387939453125, 0.6720504760742188, 0.7053070068359375, 0.7385635375976562, 0.771820068359375, 0.8050765991210938, 0.8383331298828125, 0.8715896606445312, 0.90484619140625, 0.9381027221679688, 0.9713592529296875, 1.0046157836914062, 1.037872314453125, 1.0711288452148438, 1.1043853759765625, 1.1376419067382812, 1.1708984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 12.0, 9.0, 13.0, 21.0, 32.0, 49.0, 66.0, 69.0, 89.0, 109.0, 99.0, 105.0, 99.0, 65.0, 51.0, 38.0, 23.0, 23.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.423069000244141, -4.252223014831543, -4.081377029418945, -3.910531520843506, -3.739685535430908, -3.5688395500183105, -3.397993803024292, -3.2271480560302734, -3.056302070617676, -2.885456085205078, -2.7146103382110596, -2.543764591217041, -2.3729186058044434, -2.2020726203918457, -2.031226873397827, -1.860381007194519, -1.689535140991211, -1.5186892747879028, -1.3478434085845947, -1.1769975423812866, -1.0061516761779785, -0.8353058099746704, -0.6644599437713623, -0.4936140775680542, -0.3227682113647461, -0.151922345161438, 0.018923521041870117, 0.18976938724517822, 0.36061525344848633, 0.5314611196517944, 0.7023069858551025, 0.8731528520584106, 1.0439987182617188, 1.2148445844650269, 1.385690450668335, 1.556536316871643, 1.7273821830749512, 1.8982280492782593, 2.0690739154815674, 2.239919662475586, 2.4107656478881836, 2.5816116333007812, 2.7524573802948, 2.9233031272888184, 3.094149112701416, 3.2649950981140137, 3.4358408451080322, 3.606686592102051, 3.7775325775146484, 3.948378562927246, 4.119224548339844, 4.290070056915283, 4.460916042327881, 4.6317620277404785, 4.802607536315918, 4.973453521728516, 5.144299507141113, 5.315145492553711, 5.485991477966309, 5.656836986541748, 5.827682971954346, 5.998528957366943, 6.169374465942383, 6.3402204513549805, 6.511066436767578]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 6.0, 10.0, 5.0, 18.0, 8.0, 12.0, 8.0, 14.0, 32.0, 23.0, 29.0, 22.0, 22.0, 41.0, 42.0, 33.0, 36.0, 44.0, 38.0, 43.0, 51.0, 47.0, 35.0, 43.0, 26.0, 40.0, 28.0, 32.0, 33.0, 20.0, 25.0, 32.0, 25.0, 10.0, 11.0, 9.0, 12.0, 6.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4137866497039795, -2.3262338638305664, -2.2386810779571533, -2.1511282920837402, -2.063575506210327, -1.976022720336914, -1.8884700536727905, -1.8009172677993774, -1.7133644819259644, -1.6258116960525513, -1.5382589101791382, -1.4507062435150146, -1.3631534576416016, -1.2756006717681885, -1.1880478858947754, -1.1004951000213623, -1.0129423141479492, -0.9253895282745361, -0.837836742401123, -0.7502840161323547, -0.6627312302589417, -0.5751784443855286, -0.48762571811676025, -0.40007293224334717, -0.3125201463699341, -0.2249673753976822, -0.1374146044254303, -0.0498618483543396, 0.037690937519073486, 0.12524372339248657, 0.21279644966125488, 0.30034923553466797, 0.38790202140808105, 0.47545480728149414, 0.5630075931549072, 0.6505603194236755, 0.7381131052970886, 0.8256658911705017, 0.91321861743927, 1.000771403312683, 1.0883241891860962, 1.1758769750595093, 1.2634297609329224, 1.350982427597046, 1.438535213470459, 1.526087999343872, 1.6136407852172852, 1.7011935710906982, 1.7887463569641113, 1.8762991428375244, 1.9638519287109375, 2.0514047145843506, 2.1389575004577637, 2.2265102863311768, 2.31406307220459, 2.401615619659424, 2.489168643951416, 2.576721429824829, 2.664274215698242, 2.7518270015716553, 2.8393797874450684, 2.9269325733184814, 3.0144853591918945, 3.1020379066467285, 3.1895906925201416]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 8.0, 8.0, 10.0, 17.0, 15.0, 21.0, 36.0, 72.0, 74.0, 95.0, 177.0, 255.0, 348.0, 562.0, 795.0, 1287.0, 2115.0, 3371.0, 5910.0, 10692.0, 19213.0, 36375.0, 68102.0, 119240.0, 179148.0, 203712.0, 164462.0, 104237.0, 58008.0, 31052.0, 16749.0, 8971.0, 5136.0, 3012.0, 1861.0, 1141.0, 793.0, 456.0, 328.0, 204.0, 159.0, 101.0, 73.0, 50.0, 37.0, 24.0, 15.0, 9.0, 8.0, 7.0, 4.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7060546875, -1.65167236328125, -1.5972900390625, -1.54290771484375, -1.488525390625, -1.43414306640625, -1.3797607421875, -1.32537841796875, -1.27099609375, -1.21661376953125, -1.1622314453125, -1.10784912109375, -1.053466796875, -0.99908447265625, -0.9447021484375, -0.89031982421875, -0.8359375, -0.78155517578125, -0.7271728515625, -0.67279052734375, -0.618408203125, -0.56402587890625, -0.5096435546875, -0.45526123046875, -0.40087890625, -0.34649658203125, -0.2921142578125, -0.23773193359375, -0.183349609375, -0.12896728515625, -0.0745849609375, -0.02020263671875, 0.0341796875, 0.08856201171875, 0.1429443359375, 0.19732666015625, 0.251708984375, 0.30609130859375, 0.3604736328125, 0.41485595703125, 0.46923828125, 0.52362060546875, 0.5780029296875, 0.63238525390625, 0.686767578125, 0.74114990234375, 0.7955322265625, 0.84991455078125, 0.904296875, 0.95867919921875, 1.0130615234375, 1.06744384765625, 1.121826171875, 1.17620849609375, 1.2305908203125, 1.28497314453125, 1.33935546875, 1.39373779296875, 1.4481201171875, 1.50250244140625, 1.556884765625, 1.61126708984375, 1.6656494140625, 1.72003173828125, 1.7744140625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 5.0, 11.0, 16.0, 16.0, 16.0, 26.0, 17.0, 30.0, 25.0, 28.0, 41.0, 43.0, 55.0, 45.0, 40.0, 55.0, 56.0, 57.0, 49.0, 42.0, 52.0, 44.0, 43.0, 29.0, 24.0, 17.0, 28.0, 15.0, 12.0, 13.0, 8.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.263671875, -1.2305068969726562, -1.1973419189453125, -1.1641769409179688, -1.131011962890625, -1.0978469848632812, -1.0646820068359375, -1.0315170288085938, -0.99835205078125, -0.9651870727539062, -0.9320220947265625, -0.8988571166992188, -0.865692138671875, -0.8325271606445312, -0.7993621826171875, -0.7661972045898438, -0.7330322265625, -0.6998672485351562, -0.6667022705078125, -0.6335372924804688, -0.600372314453125, -0.5672073364257812, -0.5340423583984375, -0.5008773803710938, -0.46771240234375, -0.43454742431640625, -0.4013824462890625, -0.36821746826171875, -0.335052490234375, -0.30188751220703125, -0.2687225341796875, -0.23555755615234375, -0.202392578125, -0.16922760009765625, -0.1360626220703125, -0.10289764404296875, -0.069732666015625, -0.03656768798828125, -0.0034027099609375, 0.02976226806640625, 0.06292724609375, 0.09609222412109375, 0.1292572021484375, 0.16242218017578125, 0.195587158203125, 0.22875213623046875, 0.2619171142578125, 0.29508209228515625, 0.3282470703125, 0.36141204833984375, 0.3945770263671875, 0.42774200439453125, 0.460906982421875, 0.49407196044921875, 0.5272369384765625, 0.5604019165039062, 0.59356689453125, 0.6267318725585938, 0.6598968505859375, 0.6930618286132812, 0.726226806640625, 0.7593917846679688, 0.7925567626953125, 0.8257217407226562, 0.85888671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 10.0, 9.0, 14.0, 20.0, 27.0, 41.0, 63.0, 81.0, 104.0, 138.0, 229.0, 300.0, 410.0, 597.0, 960.0, 1627.0, 5708.0, 66551.0, 744790.0, 208564.0, 12524.0, 2377.0, 1090.0, 693.0, 447.0, 331.0, 251.0, 190.0, 128.0, 99.0, 58.0, 36.0, 29.0, 22.0, 12.0, 10.0, 10.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.72265625, -6.510498046875, -6.29833984375, -6.086181640625, -5.8740234375, -5.661865234375, -5.44970703125, -5.237548828125, -5.025390625, -4.813232421875, -4.60107421875, -4.388916015625, -4.1767578125, -3.964599609375, -3.75244140625, -3.540283203125, -3.328125, -3.115966796875, -2.90380859375, -2.691650390625, -2.4794921875, -2.267333984375, -2.05517578125, -1.843017578125, -1.630859375, -1.418701171875, -1.20654296875, -0.994384765625, -0.7822265625, -0.570068359375, -0.35791015625, -0.145751953125, 0.06640625, 0.278564453125, 0.49072265625, 0.702880859375, 0.9150390625, 1.127197265625, 1.33935546875, 1.551513671875, 1.763671875, 1.975830078125, 2.18798828125, 2.400146484375, 2.6123046875, 2.824462890625, 3.03662109375, 3.248779296875, 3.4609375, 3.673095703125, 3.88525390625, 4.097412109375, 4.3095703125, 4.521728515625, 4.73388671875, 4.946044921875, 5.158203125, 5.370361328125, 5.58251953125, 5.794677734375, 6.0068359375, 6.218994140625, 6.43115234375, 6.643310546875, 6.85546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 1.0, 7.0, 10.0, 5.0, 3.0, 14.0, 16.0, 19.0, 23.0, 16.0, 21.0, 33.0, 27.0, 27.0, 29.0, 34.0, 35.0, 43.0, 50.0, 42.0, 35.0, 35.0, 50.0, 38.0, 42.0, 29.0, 36.0, 36.0, 32.0, 34.0, 28.0, 18.0, 14.0, 19.0, 12.0, 14.0, 10.0, 13.0, 10.0, 3.0, 6.0, 5.0, 5.0, 2.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.908203125, -3.787078857421875, -3.66595458984375, -3.544830322265625, -3.4237060546875, -3.302581787109375, -3.18145751953125, -3.060333251953125, -2.939208984375, -2.818084716796875, -2.69696044921875, -2.575836181640625, -2.4547119140625, -2.333587646484375, -2.21246337890625, -2.091339111328125, -1.97021484375, -1.849090576171875, -1.72796630859375, -1.606842041015625, -1.4857177734375, -1.364593505859375, -1.24346923828125, -1.122344970703125, -1.001220703125, -0.880096435546875, -0.75897216796875, -0.637847900390625, -0.5167236328125, -0.395599365234375, -0.27447509765625, -0.153350830078125, -0.0322265625, 0.088897705078125, 0.21002197265625, 0.331146240234375, 0.4522705078125, 0.573394775390625, 0.69451904296875, 0.815643310546875, 0.936767578125, 1.057891845703125, 1.17901611328125, 1.300140380859375, 1.4212646484375, 1.542388916015625, 1.66351318359375, 1.784637451171875, 1.90576171875, 2.026885986328125, 2.14801025390625, 2.269134521484375, 2.3902587890625, 2.511383056640625, 2.63250732421875, 2.753631591796875, 2.874755859375, 2.995880126953125, 3.11700439453125, 3.238128662109375, 3.3592529296875, 3.480377197265625, 3.60150146484375, 3.722625732421875, 3.84375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 0.0, 6.0, 7.0, 7.0, 7.0, 6.0, 15.0, 25.0, 23.0, 45.0, 56.0, 74.0, 127.0, 178.0, 320.0, 550.0, 1146.0, 3256.0, 16739.0, 177337.0, 743416.0, 90221.0, 10266.0, 2455.0, 991.0, 482.0, 284.0, 164.0, 98.0, 78.0, 48.0, 33.0, 29.0, 20.0, 10.0, 8.0, 7.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.82421875, -2.731231689453125, -2.63824462890625, -2.545257568359375, -2.4522705078125, -2.359283447265625, -2.26629638671875, -2.173309326171875, -2.080322265625, -1.987335205078125, -1.89434814453125, -1.801361083984375, -1.7083740234375, -1.615386962890625, -1.52239990234375, -1.429412841796875, -1.33642578125, -1.243438720703125, -1.15045166015625, -1.057464599609375, -0.9644775390625, -0.871490478515625, -0.77850341796875, -0.685516357421875, -0.592529296875, -0.499542236328125, -0.40655517578125, -0.313568115234375, -0.2205810546875, -0.127593994140625, -0.03460693359375, 0.058380126953125, 0.1513671875, 0.244354248046875, 0.33734130859375, 0.430328369140625, 0.5233154296875, 0.616302490234375, 0.70928955078125, 0.802276611328125, 0.895263671875, 0.988250732421875, 1.08123779296875, 1.174224853515625, 1.2672119140625, 1.360198974609375, 1.45318603515625, 1.546173095703125, 1.63916015625, 1.732147216796875, 1.82513427734375, 1.918121337890625, 2.0111083984375, 2.104095458984375, 2.19708251953125, 2.290069580078125, 2.383056640625, 2.476043701171875, 2.56903076171875, 2.662017822265625, 2.7550048828125, 2.847991943359375, 2.94097900390625, 3.033966064453125, 3.126953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 5.0, 4.0, 14.0, 19.0, 29.0, 27.0, 63.0, 70.0, 81.0, 117.0, 113.0, 108.0, 96.0, 69.0, 49.0, 31.0, 30.0, 18.0, 13.0, 10.0, 8.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003783702850341797, -0.0003658905625343323, -0.00035341084003448486, -0.00034093111753463745, -0.00032845139503479004, -0.0003159716725349426, -0.0003034919500350952, -0.0002910122275352478, -0.0002785325050354004, -0.000266052782535553, -0.00025357306003570557, -0.00024109333753585815, -0.00022861361503601074, -0.00021613389253616333, -0.00020365417003631592, -0.0001911744475364685, -0.0001786947250366211, -0.00016621500253677368, -0.00015373528003692627, -0.00014125555753707886, -0.00012877583503723145, -0.00011629611253738403, -0.00010381639003753662, -9.133666753768921e-05, -7.88569450378418e-05, -6.637722253799438e-05, -5.389750003814697e-05, -4.141777753829956e-05, -2.893805503845215e-05, -1.6458332538604736e-05, -3.978610038757324e-06, 8.501112461090088e-06, 2.09808349609375e-05, 3.346055746078491e-05, 4.5940279960632324e-05, 5.8420002460479736e-05, 7.089972496032715e-05, 8.337944746017456e-05, 9.585916996002197e-05, 0.00010833889245986938, 0.0001208186149597168, 0.0001332983374595642, 0.00014577805995941162, 0.00015825778245925903, 0.00017073750495910645, 0.00018321722745895386, 0.00019569694995880127, 0.00020817667245864868, 0.0002206563949584961, 0.0002331361174583435, 0.0002456158399581909, 0.00025809556245803833, 0.00027057528495788574, 0.00028305500745773315, 0.00029553472995758057, 0.000308014452457428, 0.0003204941749572754, 0.0003329738974571228, 0.0003454536199569702, 0.0003579333424568176, 0.00037041306495666504, 0.00038289278745651245, 0.00039537250995635986, 0.0004078522324562073, 0.0004203319549560547]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 11.0, 22.0, 28.0, 49.0, 86.0, 179.0, 343.0, 942.0, 3163.0, 45279.0, 950823.0, 42858.0, 3127.0, 914.0, 349.0, 158.0, 84.0, 55.0, 21.0, 9.0, 17.0, 11.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.07421875, -5.88134765625, -5.6884765625, -5.49560546875, -5.302734375, -5.10986328125, -4.9169921875, -4.72412109375, -4.53125, -4.33837890625, -4.1455078125, -3.95263671875, -3.759765625, -3.56689453125, -3.3740234375, -3.18115234375, -2.98828125, -2.79541015625, -2.6025390625, -2.40966796875, -2.216796875, -2.02392578125, -1.8310546875, -1.63818359375, -1.4453125, -1.25244140625, -1.0595703125, -0.86669921875, -0.673828125, -0.48095703125, -0.2880859375, -0.09521484375, 0.09765625, 0.29052734375, 0.4833984375, 0.67626953125, 0.869140625, 1.06201171875, 1.2548828125, 1.44775390625, 1.640625, 1.83349609375, 2.0263671875, 2.21923828125, 2.412109375, 2.60498046875, 2.7978515625, 2.99072265625, 3.18359375, 3.37646484375, 3.5693359375, 3.76220703125, 3.955078125, 4.14794921875, 4.3408203125, 4.53369140625, 4.7265625, 4.91943359375, 5.1123046875, 5.30517578125, 5.498046875, 5.69091796875, 5.8837890625, 6.07666015625, 6.26953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 4.0, 12.0, 23.0, 41.0, 61.0, 91.0, 116.0, 132.0, 155.0, 111.0, 98.0, 42.0, 37.0, 26.0, 21.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.3128662109375, -2.207763671875, -2.1026611328125, -1.99755859375, -1.8924560546875, -1.787353515625, -1.6822509765625, -1.5771484375, -1.4720458984375, -1.366943359375, -1.2618408203125, -1.15673828125, -1.0516357421875, -0.946533203125, -0.8414306640625, -0.736328125, -0.6312255859375, -0.526123046875, -0.4210205078125, -0.31591796875, -0.2108154296875, -0.105712890625, -0.0006103515625, 0.1044921875, 0.2095947265625, 0.314697265625, 0.4197998046875, 0.52490234375, 0.6300048828125, 0.735107421875, 0.8402099609375, 0.9453125, 1.0504150390625, 1.155517578125, 1.2606201171875, 1.36572265625, 1.4708251953125, 1.575927734375, 1.6810302734375, 1.7861328125, 1.8912353515625, 1.996337890625, 2.1014404296875, 2.20654296875, 2.3116455078125, 2.416748046875, 2.5218505859375, 2.626953125, 2.7320556640625, 2.837158203125, 2.9422607421875, 3.04736328125, 3.1524658203125, 3.257568359375, 3.3626708984375, 3.4677734375, 3.5728759765625, 3.677978515625, 3.7830810546875, 3.88818359375, 3.9932861328125, 4.098388671875, 4.2034912109375, 4.30859375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 7.0, 10.0, 16.0, 42.0, 100.0, 154.0, 216.0, 189.0, 146.0, 77.0, 28.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.998624801635742, -30.387989044189453, -28.777353286743164, -27.166717529296875, -25.556081771850586, -23.945446014404297, -22.334808349609375, -20.72417449951172, -19.113536834716797, -17.502901077270508, -15.892265319824219, -14.28162956237793, -12.67099380493164, -11.060357093811035, -9.449721336364746, -7.839085578918457, -6.228450775146484, -4.617815017700195, -3.007179021835327, -1.396543025970459, 0.21409273147583008, 1.8247289657592773, 3.4353647232055664, 5.0460004806518555, 6.6566362380981445, 8.267271995544434, 9.877907752990723, 11.488544464111328, 13.099180221557617, 14.709815979003906, 16.320451736450195, 17.931087493896484, 19.54172134399414, 21.15235710144043, 22.76299285888672, 24.373628616333008, 25.984264373779297, 27.59490203857422, 29.205535888671875, 30.816173553466797, 32.42680740356445, 34.037445068359375, 35.64807891845703, 37.25871658325195, 38.86935043334961, 40.47998809814453, 42.09062194824219, 43.70125961303711, 45.31189727783203, 46.92253494262695, 48.53316879272461, 50.14380645751953, 51.75444030761719, 53.36507797241211, 54.975711822509766, 56.58634948730469, 58.196983337402344, 59.807621002197266, 61.41825485229492, 63.028892517089844, 64.6395263671875, 66.25016021728516, 67.86080169677734, 69.471435546875, 71.08206939697266]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 9.0, 4.0, 2.0, 8.0, 10.0, 8.0, 6.0, 16.0, 19.0, 17.0, 25.0, 29.0, 30.0, 33.0, 27.0, 41.0, 51.0, 45.0, 37.0, 46.0, 44.0, 44.0, 43.0, 47.0, 52.0, 43.0, 30.0, 33.0, 37.0, 20.0, 16.0, 23.0, 12.0, 16.0, 19.0, 12.0, 12.0, 5.0, 6.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0], "bins": [-21.228343963623047, -20.62083625793457, -20.013328552246094, -19.405818939208984, -18.798311233520508, -18.19080352783203, -17.583295822143555, -16.975788116455078, -16.36827850341797, -15.760770797729492, -15.1532621383667, -14.545754432678223, -13.93824577331543, -13.330738067626953, -12.723230361938477, -12.115721702575684, -11.508213996887207, -10.90070629119873, -10.293197631835938, -9.685689926147461, -9.078181266784668, -8.470673561096191, -7.863165378570557, -7.255657196044922, -6.648149013519287, -6.040640830993652, -5.433132648468018, -4.825624465942383, -4.218116760253906, -3.6106083393096924, -3.0031003952026367, -2.395592212677002, -1.7880840301513672, -1.1805758476257324, -0.5730677843093872, 0.03444027900695801, 0.6419484615325928, 1.2494566440582275, 1.8569645881652832, 2.464472770690918, 3.0719809532165527, 3.6794891357421875, 4.286997318267822, 4.894505500793457, 5.502013206481934, 6.109521865844727, 6.717029571533203, 7.324537754058838, 7.932045936584473, 8.53955364227295, 9.147062301635742, 9.754570007324219, 10.362078666687012, 10.969586372375488, 11.577095031738281, 12.184602737426758, 12.792110443115234, 13.399618148803711, 14.007126808166504, 14.61463451385498, 15.222143173217773, 15.82965087890625, 16.437158584594727, 17.044666290283203, 17.652175903320312]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 4.0, 9.0, 5.0, 14.0, 13.0, 25.0, 31.0, 58.0, 54.0, 74.0, 113.0, 187.0, 226.0, 365.0, 563.0, 837.0, 1380.0, 2568.0, 6388.0, 26817.0, 4045600.0, 88670.0, 11486.0, 3883.0, 1722.0, 1040.0, 667.0, 442.0, 325.0, 208.0, 131.0, 92.0, 71.0, 53.0, 39.0, 31.0, 17.0, 21.0, 10.0, 7.0, 6.0, 6.0, 3.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.09375, -7.86077880859375, -7.6278076171875, -7.39483642578125, -7.161865234375, -6.92889404296875, -6.6959228515625, -6.46295166015625, -6.22998046875, -5.99700927734375, -5.7640380859375, -5.53106689453125, -5.298095703125, -5.06512451171875, -4.8321533203125, -4.59918212890625, -4.3662109375, -4.13323974609375, -3.9002685546875, -3.66729736328125, -3.434326171875, -3.20135498046875, -2.9683837890625, -2.73541259765625, -2.50244140625, -2.26947021484375, -2.0364990234375, -1.80352783203125, -1.570556640625, -1.33758544921875, -1.1046142578125, -0.87164306640625, -0.638671875, -0.40570068359375, -0.1727294921875, 0.06024169921875, 0.293212890625, 0.52618408203125, 0.7591552734375, 0.99212646484375, 1.22509765625, 1.45806884765625, 1.6910400390625, 1.92401123046875, 2.156982421875, 2.38995361328125, 2.6229248046875, 2.85589599609375, 3.0888671875, 3.32183837890625, 3.5548095703125, 3.78778076171875, 4.020751953125, 4.25372314453125, 4.4866943359375, 4.71966552734375, 4.95263671875, 5.18560791015625, 5.4185791015625, 5.65155029296875, 5.884521484375, 6.11749267578125, 6.3504638671875, 6.58343505859375, 6.81640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 6.0, 5.0, 9.0, 15.0, 8.0, 16.0, 17.0, 21.0, 27.0, 26.0, 36.0, 38.0, 44.0, 45.0, 46.0, 52.0, 53.0, 43.0, 52.0, 52.0, 49.0, 39.0, 55.0, 40.0, 31.0, 25.0, 30.0, 25.0, 18.0, 21.0, 5.0, 12.0, 7.0, 11.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1767578125, -1.141571044921875, -1.10638427734375, -1.071197509765625, -1.0360107421875, -1.000823974609375, -0.96563720703125, -0.930450439453125, -0.895263671875, -0.860076904296875, -0.82489013671875, -0.789703369140625, -0.7545166015625, -0.719329833984375, -0.68414306640625, -0.648956298828125, -0.61376953125, -0.578582763671875, -0.54339599609375, -0.508209228515625, -0.4730224609375, -0.437835693359375, -0.40264892578125, -0.367462158203125, -0.332275390625, -0.297088623046875, -0.26190185546875, -0.226715087890625, -0.1915283203125, -0.156341552734375, -0.12115478515625, -0.085968017578125, -0.05078125, -0.015594482421875, 0.01959228515625, 0.054779052734375, 0.0899658203125, 0.125152587890625, 0.16033935546875, 0.195526123046875, 0.230712890625, 0.265899658203125, 0.30108642578125, 0.336273193359375, 0.3714599609375, 0.406646728515625, 0.44183349609375, 0.477020263671875, 0.51220703125, 0.547393798828125, 0.58258056640625, 0.617767333984375, 0.6529541015625, 0.688140869140625, 0.72332763671875, 0.758514404296875, 0.793701171875, 0.828887939453125, 0.86407470703125, 0.899261474609375, 0.9344482421875, 0.969635009765625, 1.00482177734375, 1.040008544921875, 1.0751953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 15.0, 19.0, 34.0, 44.0, 46.0, 64.0, 108.0, 124.0, 202.0, 270.0, 477.0, 656.0, 997.0, 1626.0, 2714.0, 4854.0, 10669.0, 34460.0, 3882871.0, 212630.0, 22695.0, 8196.0, 4106.0, 2282.0, 1339.0, 912.0, 561.0, 410.0, 282.0, 188.0, 126.0, 91.0, 50.0, 41.0, 34.0, 16.0, 19.0, 14.0, 8.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.15625, -5.00830078125, -4.8603515625, -4.71240234375, -4.564453125, -4.41650390625, -4.2685546875, -4.12060546875, -3.97265625, -3.82470703125, -3.6767578125, -3.52880859375, -3.380859375, -3.23291015625, -3.0849609375, -2.93701171875, -2.7890625, -2.64111328125, -2.4931640625, -2.34521484375, -2.197265625, -2.04931640625, -1.9013671875, -1.75341796875, -1.60546875, -1.45751953125, -1.3095703125, -1.16162109375, -1.013671875, -0.86572265625, -0.7177734375, -0.56982421875, -0.421875, -0.27392578125, -0.1259765625, 0.02197265625, 0.169921875, 0.31787109375, 0.4658203125, 0.61376953125, 0.76171875, 0.90966796875, 1.0576171875, 1.20556640625, 1.353515625, 1.50146484375, 1.6494140625, 1.79736328125, 1.9453125, 2.09326171875, 2.2412109375, 2.38916015625, 2.537109375, 2.68505859375, 2.8330078125, 2.98095703125, 3.12890625, 3.27685546875, 3.4248046875, 3.57275390625, 3.720703125, 3.86865234375, 4.0166015625, 4.16455078125, 4.3125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 9.0, 15.0, 22.0, 64.0, 146.0, 3379.0, 250.0, 63.0, 26.0, 20.0, 8.0, 11.0, 2.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1446990966796875, -1.109710693359375, -1.0747222900390625, -1.03973388671875, -1.0047454833984375, -0.969757080078125, -0.9347686767578125, -0.8997802734375, -0.8647918701171875, -0.829803466796875, -0.7948150634765625, -0.75982666015625, -0.7248382568359375, -0.689849853515625, -0.6548614501953125, -0.619873046875, -0.5848846435546875, -0.549896240234375, -0.5149078369140625, -0.47991943359375, -0.4449310302734375, -0.409942626953125, -0.3749542236328125, -0.3399658203125, -0.3049774169921875, -0.269989013671875, -0.2350006103515625, -0.20001220703125, -0.1650238037109375, -0.130035400390625, -0.0950469970703125, -0.06005859375, -0.0250701904296875, 0.009918212890625, 0.0449066162109375, 0.07989501953125, 0.1148834228515625, 0.149871826171875, 0.1848602294921875, 0.2198486328125, 0.2548370361328125, 0.289825439453125, 0.3248138427734375, 0.35980224609375, 0.3947906494140625, 0.429779052734375, 0.4647674560546875, 0.499755859375, 0.5347442626953125, 0.569732666015625, 0.6047210693359375, 0.63970947265625, 0.6746978759765625, 0.709686279296875, 0.7446746826171875, 0.7796630859375, 0.8146514892578125, 0.849639892578125, 0.8846282958984375, 0.91961669921875, 0.9546051025390625, 0.989593505859375, 1.0245819091796875, 1.0595703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 12.0, 26.0, 40.0, 79.0, 120.0, 151.0, 189.0, 171.0, 89.0, 63.0, 31.0, 14.0, 10.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-11.44223403930664, -11.214584350585938, -10.986934661865234, -10.759284973144531, -10.531635284423828, -10.303985595703125, -10.076335906982422, -9.848686218261719, -9.621036529541016, -9.393386840820312, -9.16573715209961, -8.938087463378906, -8.710437774658203, -8.4827880859375, -8.255138397216797, -8.027488708496094, -7.799838066101074, -7.572188377380371, -7.344538688659668, -7.116888999938965, -6.889239311218262, -6.661589622497559, -6.433939456939697, -6.206289768218994, -5.978640079498291, -5.750990390777588, -5.523340702056885, -5.295691013336182, -5.06804084777832, -4.840391159057617, -4.612741470336914, -4.385091781616211, -4.157442092895508, -3.9297924041748047, -3.7021427154541016, -3.4744927883148193, -3.246843099594116, -3.019193410873413, -2.791543483734131, -2.5638937950134277, -2.3362441062927246, -2.1085944175720215, -1.8809446096420288, -1.6532948017120361, -1.425645112991333, -1.1979954242706299, -0.9703456163406372, -0.7426958084106445, -0.5150461196899414, -0.2873963713645935, -0.059746623039245605, 0.1679031252861023, 0.3955528736114502, 0.6232025623321533, 0.850852370262146, 1.0785021781921387, 1.3061518669128418, 1.533801555633545, 1.7614513635635376, 1.9891011714935303, 2.2167508602142334, 2.4444005489349365, 2.6720504760742188, 2.899700164794922, 3.127349853515625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 1.0, 5.0, 6.0, 9.0, 9.0, 6.0, 17.0, 14.0, 13.0, 20.0, 21.0, 33.0, 32.0, 29.0, 28.0, 29.0, 39.0, 46.0, 62.0, 46.0, 55.0, 41.0, 51.0, 41.0, 33.0, 40.0, 29.0, 33.0, 30.0, 27.0, 29.0, 22.0, 19.0, 14.0, 12.0, 14.0, 11.0, 10.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2060015201568604, -2.131774425506592, -2.0575475692749023, -1.9833204746246338, -1.9090934991836548, -1.8348665237426758, -1.7606394290924072, -1.6864124536514282, -1.6121854782104492, -1.5379585027694702, -1.4637315273284912, -1.3895044326782227, -1.3152774572372437, -1.2410504817962646, -1.166823387145996, -1.092596411705017, -1.018369436264038, -0.9441424608230591, -0.8699154257774353, -0.7956883907318115, -0.7214614152908325, -0.6472344398498535, -0.5730074048042297, -0.49878036975860596, -0.42455339431762695, -0.35032638907432556, -0.27609938383102417, -0.20187237858772278, -0.1276453733444214, -0.053418368101119995, 0.020808637142181396, 0.09503567218780518, 0.16926240921020508, 0.24348941445350647, 0.31771641969680786, 0.39194342494010925, 0.46617043018341064, 0.5403974056243896, 0.6146244406700134, 0.6888514757156372, 0.7630784511566162, 0.8373054265975952, 0.911532461643219, 0.9857594966888428, 1.0599864721298218, 1.1342134475708008, 1.2084405422210693, 1.2826675176620483, 1.3568944931030273, 1.4311214685440063, 1.5053484439849854, 1.579575538635254, 1.653802514076233, 1.728029489517212, 1.8022565841674805, 1.8764835596084595, 1.9507105350494385, 2.024937629699707, 2.0991644859313965, 2.173391580581665, 2.2476186752319336, 2.321845531463623, 2.3960726261138916, 2.47029972076416, 2.5445265769958496]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 7.0, 1.0, 2.0, 6.0, 9.0, 7.0, 7.0, 10.0, 24.0, 28.0, 41.0, 83.0, 123.0, 192.0, 434.0, 1030.0, 3065.0, 11161.0, 47959.0, 222451.0, 508720.0, 196301.0, 42307.0, 9876.0, 2818.0, 969.0, 408.0, 206.0, 101.0, 73.0, 30.0, 30.0, 19.0, 13.0, 18.0, 13.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.798248291015625, -4.65899658203125, -4.519744873046875, -4.3804931640625, -4.241241455078125, -4.10198974609375, -3.962738037109375, -3.823486328125, -3.684234619140625, -3.54498291015625, -3.405731201171875, -3.2664794921875, -3.127227783203125, -2.98797607421875, -2.848724365234375, -2.70947265625, -2.570220947265625, -2.43096923828125, -2.291717529296875, -2.1524658203125, -2.013214111328125, -1.87396240234375, -1.734710693359375, -1.595458984375, -1.456207275390625, -1.31695556640625, -1.177703857421875, -1.0384521484375, -0.899200439453125, -0.75994873046875, -0.620697021484375, -0.4814453125, -0.342193603515625, -0.20294189453125, -0.063690185546875, 0.0755615234375, 0.214813232421875, 0.35406494140625, 0.493316650390625, 0.632568359375, 0.771820068359375, 0.91107177734375, 1.050323486328125, 1.1895751953125, 1.328826904296875, 1.46807861328125, 1.607330322265625, 1.74658203125, 1.885833740234375, 2.02508544921875, 2.164337158203125, 2.3035888671875, 2.442840576171875, 2.58209228515625, 2.721343994140625, 2.860595703125, 2.999847412109375, 3.13909912109375, 3.278350830078125, 3.4176025390625, 3.556854248046875, 3.69610595703125, 3.835357666015625, 3.974609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 8.0, 7.0, 10.0, 9.0, 14.0, 15.0, 25.0, 22.0, 26.0, 33.0, 34.0, 32.0, 33.0, 41.0, 50.0, 46.0, 42.0, 40.0, 38.0, 40.0, 50.0, 51.0, 43.0, 39.0, 37.0, 28.0, 30.0, 22.0, 16.0, 18.0, 16.0, 17.0, 16.0, 12.0, 8.0, 9.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1142578125, -1.080352783203125, -1.04644775390625, -1.012542724609375, -0.9786376953125, -0.944732666015625, -0.91082763671875, -0.876922607421875, -0.843017578125, -0.809112548828125, -0.77520751953125, -0.741302490234375, -0.7073974609375, -0.673492431640625, -0.63958740234375, -0.605682373046875, -0.57177734375, -0.537872314453125, -0.50396728515625, -0.470062255859375, -0.4361572265625, -0.402252197265625, -0.36834716796875, -0.334442138671875, -0.300537109375, -0.266632080078125, -0.23272705078125, -0.198822021484375, -0.1649169921875, -0.131011962890625, -0.09710693359375, -0.063201904296875, -0.029296875, 0.004608154296875, 0.03851318359375, 0.072418212890625, 0.1063232421875, 0.140228271484375, 0.17413330078125, 0.208038330078125, 0.241943359375, 0.275848388671875, 0.30975341796875, 0.343658447265625, 0.3775634765625, 0.411468505859375, 0.44537353515625, 0.479278564453125, 0.51318359375, 0.547088623046875, 0.58099365234375, 0.614898681640625, 0.6488037109375, 0.682708740234375, 0.71661376953125, 0.750518798828125, 0.784423828125, 0.818328857421875, 0.85223388671875, 0.886138916015625, 0.9200439453125, 0.953948974609375, 0.98785400390625, 1.021759033203125, 1.0556640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 6.0, 9.0, 7.0, 11.0, 29.0, 43.0, 57.0, 79.0, 146.0, 228.0, 352.0, 619.0, 999.0, 2454.0, 11699.0, 188197.0, 782042.0, 52263.0, 5564.0, 1670.0, 787.0, 481.0, 304.0, 198.0, 109.0, 80.0, 52.0, 25.0, 22.0, 5.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.875, -8.64324951171875, -8.4114990234375, -8.17974853515625, -7.947998046875, -7.71624755859375, -7.4844970703125, -7.25274658203125, -7.02099609375, -6.78924560546875, -6.5574951171875, -6.32574462890625, -6.093994140625, -5.86224365234375, -5.6304931640625, -5.39874267578125, -5.1669921875, -4.93524169921875, -4.7034912109375, -4.47174072265625, -4.239990234375, -4.00823974609375, -3.7764892578125, -3.54473876953125, -3.31298828125, -3.08123779296875, -2.8494873046875, -2.61773681640625, -2.385986328125, -2.15423583984375, -1.9224853515625, -1.69073486328125, -1.458984375, -1.22723388671875, -0.9954833984375, -0.76373291015625, -0.531982421875, -0.30023193359375, -0.0684814453125, 0.16326904296875, 0.39501953125, 0.62677001953125, 0.8585205078125, 1.09027099609375, 1.322021484375, 1.55377197265625, 1.7855224609375, 2.01727294921875, 2.2490234375, 2.48077392578125, 2.7125244140625, 2.94427490234375, 3.176025390625, 3.40777587890625, 3.6395263671875, 3.87127685546875, 4.10302734375, 4.33477783203125, 4.5665283203125, 4.79827880859375, 5.030029296875, 5.26177978515625, 5.4935302734375, 5.72528076171875, 5.95703125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 9.0, 4.0, 10.0, 2.0, 9.0, 8.0, 9.0, 13.0, 23.0, 22.0, 24.0, 35.0, 39.0, 37.0, 40.0, 35.0, 43.0, 52.0, 38.0, 49.0, 49.0, 49.0, 56.0, 38.0, 39.0, 41.0, 32.0, 32.0, 29.0, 21.0, 27.0, 20.0, 17.0, 12.0, 9.0, 10.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21875, -5.05987548828125, -4.9010009765625, -4.74212646484375, -4.583251953125, -4.42437744140625, -4.2655029296875, -4.10662841796875, -3.94775390625, -3.78887939453125, -3.6300048828125, -3.47113037109375, -3.312255859375, -3.15338134765625, -2.9945068359375, -2.83563232421875, -2.6767578125, -2.51788330078125, -2.3590087890625, -2.20013427734375, -2.041259765625, -1.88238525390625, -1.7235107421875, -1.56463623046875, -1.40576171875, -1.24688720703125, -1.0880126953125, -0.92913818359375, -0.770263671875, -0.61138916015625, -0.4525146484375, -0.29364013671875, -0.134765625, 0.02410888671875, 0.1829833984375, 0.34185791015625, 0.500732421875, 0.65960693359375, 0.8184814453125, 0.97735595703125, 1.13623046875, 1.29510498046875, 1.4539794921875, 1.61285400390625, 1.771728515625, 1.93060302734375, 2.0894775390625, 2.24835205078125, 2.4072265625, 2.56610107421875, 2.7249755859375, 2.88385009765625, 3.042724609375, 3.20159912109375, 3.3604736328125, 3.51934814453125, 3.67822265625, 3.83709716796875, 3.9959716796875, 4.15484619140625, 4.313720703125, 4.47259521484375, 4.6314697265625, 4.79034423828125, 4.94921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 7.0, 19.0, 24.0, 20.0, 24.0, 37.0, 44.0, 75.0, 102.0, 156.0, 287.0, 580.0, 1765.0, 9214.0, 125510.0, 847694.0, 54967.0, 5576.0, 1222.0, 491.0, 240.0, 136.0, 81.0, 74.0, 53.0, 23.0, 26.0, 20.0, 22.0, 8.0, 5.0, 9.0, 8.0, 4.0, 7.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.46875, -4.3262939453125, -4.183837890625, -4.0413818359375, -3.89892578125, -3.7564697265625, -3.614013671875, -3.4715576171875, -3.3291015625, -3.1866455078125, -3.044189453125, -2.9017333984375, -2.75927734375, -2.6168212890625, -2.474365234375, -2.3319091796875, -2.189453125, -2.0469970703125, -1.904541015625, -1.7620849609375, -1.61962890625, -1.4771728515625, -1.334716796875, -1.1922607421875, -1.0498046875, -0.9073486328125, -0.764892578125, -0.6224365234375, -0.47998046875, -0.3375244140625, -0.195068359375, -0.0526123046875, 0.08984375, 0.2322998046875, 0.374755859375, 0.5172119140625, 0.65966796875, 0.8021240234375, 0.944580078125, 1.0870361328125, 1.2294921875, 1.3719482421875, 1.514404296875, 1.6568603515625, 1.79931640625, 1.9417724609375, 2.084228515625, 2.2266845703125, 2.369140625, 2.5115966796875, 2.654052734375, 2.7965087890625, 2.93896484375, 3.0814208984375, 3.223876953125, 3.3663330078125, 3.5087890625, 3.6512451171875, 3.793701171875, 3.9361572265625, 4.07861328125, 4.2210693359375, 4.363525390625, 4.5059814453125, 4.6484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 3.0, 6.0, 9.0, 8.0, 26.0, 26.0, 28.0, 39.0, 47.0, 64.0, 83.0, 123.0, 123.0, 108.0, 74.0, 60.0, 37.0, 27.0, 23.0, 14.0, 13.0, 13.0, 10.0, 8.0, 6.0, 3.0, 1.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004513263702392578, -0.0004377886652946472, -0.0004242509603500366, -0.000410713255405426, -0.00039717555046081543, -0.00038363784551620483, -0.00037010014057159424, -0.00035656243562698364, -0.00034302473068237305, -0.00032948702573776245, -0.00031594932079315186, -0.00030241161584854126, -0.00028887391090393066, -0.00027533620595932007, -0.00026179850101470947, -0.0002482607960700989, -0.00023472309112548828, -0.00022118538618087769, -0.0002076476812362671, -0.0001941099762916565, -0.0001805722713470459, -0.0001670345664024353, -0.0001534968614578247, -0.0001399591565132141, -0.00012642145156860352, -0.00011288374662399292, -9.934604167938232e-05, -8.580833673477173e-05, -7.227063179016113e-05, -5.873292684555054e-05, -4.519522190093994e-05, -3.1657516956329346e-05, -1.811981201171875e-05, -4.582107067108154e-06, 8.955597877502441e-06, 2.2493302822113037e-05, 3.603100776672363e-05, 4.956871271133423e-05, 6.310641765594482e-05, 7.664412260055542e-05, 9.018182754516602e-05, 0.00010371953248977661, 0.00011725723743438721, 0.0001307949423789978, 0.0001443326473236084, 0.000157870352268219, 0.0001714080572128296, 0.00018494576215744019, 0.00019848346710205078, 0.00021202117204666138, 0.00022555887699127197, 0.00023909658193588257, 0.00025263428688049316, 0.00026617199182510376, 0.00027970969676971436, 0.00029324740171432495, 0.00030678510665893555, 0.00032032281160354614, 0.00033386051654815674, 0.00034739822149276733, 0.00036093592643737793, 0.0003744736313819885, 0.0003880113363265991, 0.0004015490412712097, 0.0004150867462158203]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 9.0, 11.0, 14.0, 26.0, 37.0, 46.0, 74.0, 129.0, 177.0, 297.0, 501.0, 1012.0, 2383.0, 7918.0, 46797.0, 561104.0, 383969.0, 33690.0, 6215.0, 1981.0, 891.0, 521.0, 243.0, 157.0, 104.0, 76.0, 38.0, 40.0, 17.0, 9.0, 18.0, 5.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.2545166015625, -3.145751953125, -3.0369873046875, -2.92822265625, -2.8194580078125, -2.710693359375, -2.6019287109375, -2.4931640625, -2.3843994140625, -2.275634765625, -2.1668701171875, -2.05810546875, -1.9493408203125, -1.840576171875, -1.7318115234375, -1.623046875, -1.5142822265625, -1.405517578125, -1.2967529296875, -1.18798828125, -1.0792236328125, -0.970458984375, -0.8616943359375, -0.7529296875, -0.6441650390625, -0.535400390625, -0.4266357421875, -0.31787109375, -0.2091064453125, -0.100341796875, 0.0084228515625, 0.1171875, 0.2259521484375, 0.334716796875, 0.4434814453125, 0.55224609375, 0.6610107421875, 0.769775390625, 0.8785400390625, 0.9873046875, 1.0960693359375, 1.204833984375, 1.3135986328125, 1.42236328125, 1.5311279296875, 1.639892578125, 1.7486572265625, 1.857421875, 1.9661865234375, 2.074951171875, 2.1837158203125, 2.29248046875, 2.4012451171875, 2.510009765625, 2.6187744140625, 2.7275390625, 2.8363037109375, 2.945068359375, 3.0538330078125, 3.16259765625, 3.2713623046875, 3.380126953125, 3.4888916015625, 3.59765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 10.0, 12.0, 14.0, 24.0, 26.0, 32.0, 52.0, 60.0, 112.0, 120.0, 104.0, 101.0, 88.0, 70.0, 47.0, 33.0, 31.0, 15.0, 9.0, 10.0, 6.0, 4.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.056640625, -1.964080810546875, -1.87152099609375, -1.778961181640625, -1.6864013671875, -1.593841552734375, -1.50128173828125, -1.408721923828125, -1.316162109375, -1.223602294921875, -1.13104248046875, -1.038482666015625, -0.9459228515625, -0.853363037109375, -0.76080322265625, -0.668243408203125, -0.57568359375, -0.483123779296875, -0.39056396484375, -0.298004150390625, -0.2054443359375, -0.112884521484375, -0.02032470703125, 0.072235107421875, 0.164794921875, 0.257354736328125, 0.34991455078125, 0.442474365234375, 0.5350341796875, 0.627593994140625, 0.72015380859375, 0.812713623046875, 0.9052734375, 0.997833251953125, 1.09039306640625, 1.182952880859375, 1.2755126953125, 1.368072509765625, 1.46063232421875, 1.553192138671875, 1.645751953125, 1.738311767578125, 1.83087158203125, 1.923431396484375, 2.0159912109375, 2.108551025390625, 2.20111083984375, 2.293670654296875, 2.38623046875, 2.478790283203125, 2.57135009765625, 2.663909912109375, 2.7564697265625, 2.849029541015625, 2.94158935546875, 3.034149169921875, 3.126708984375, 3.219268798828125, 3.31182861328125, 3.404388427734375, 3.4969482421875, 3.589508056640625, 3.68206787109375, 3.774627685546875, 3.8671875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 11.0, 33.0, 132.0, 256.0, 317.0, 172.0, 51.0, 13.0, 7.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.981239318847656, -50.22185134887695, -47.462459564208984, -44.70307159423828, -41.94367980957031, -39.18429183959961, -36.424903869628906, -33.66551208496094, -30.906124114990234, -28.1467342376709, -25.387344360351562, -22.62795639038086, -19.868566513061523, -17.109176635742188, -14.349788665771484, -11.590398788452148, -8.831008911132812, -6.071619510650635, -3.312230110168457, -0.5528411865234375, 2.2065486907958984, 4.965938568115234, 7.7253265380859375, 10.484716415405273, 13.24410629272461, 16.003496170043945, 18.76288604736328, 21.522274017333984, 24.28166389465332, 27.041053771972656, 29.80044174194336, 32.55982971191406, 35.31922149658203, 38.078609466552734, 40.8380012512207, 43.597389221191406, 46.356781005859375, 49.11616897583008, 51.87555694580078, 54.63494873046875, 57.39433670043945, 60.153724670410156, 62.913116455078125, 65.67250061035156, 68.43189239501953, 71.1912841796875, 73.95066833496094, 76.7100601196289, 79.46945190429688, 82.22884368896484, 84.98822784423828, 87.74761962890625, 90.50701141357422, 93.26640319824219, 96.02578735351562, 98.7851791381836, 101.54457092285156, 104.30396270751953, 107.06334686279297, 109.82273864746094, 112.5821304321289, 115.34152221679688, 118.10090637207031, 120.86029815673828, 123.61968231201172]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 11.0, 8.0, 17.0, 13.0, 10.0, 9.0, 19.0, 12.0, 26.0, 20.0, 22.0, 35.0, 37.0, 30.0, 38.0, 45.0, 42.0, 34.0, 44.0, 46.0, 52.0, 39.0, 47.0, 39.0, 23.0, 28.0, 28.0, 23.0, 25.0, 26.0, 28.0, 13.0, 13.0, 15.0, 12.0, 13.0, 15.0, 8.0, 9.0, 2.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-22.928943634033203, -22.27569007873535, -21.6224365234375, -20.969181060791016, -20.315927505493164, -19.662673950195312, -19.009418487548828, -18.356164932250977, -17.702911376953125, -17.049657821655273, -16.396404266357422, -15.743148803710938, -15.089895248413086, -14.436641693115234, -13.783387184143066, -13.130132675170898, -12.476879119873047, -11.823625564575195, -11.170371055603027, -10.51711654663086, -9.863862991333008, -9.210609436035156, -8.557354927062988, -7.9041008949279785, -7.250846862792969, -6.597592830657959, -5.944338798522949, -5.2910847663879395, -4.63783073425293, -3.98457670211792, -3.33132266998291, -2.6780686378479004, -2.0248146057128906, -1.3715605735778809, -0.7183065414428711, -0.06505250930786133, 0.5882015228271484, 1.2414555549621582, 1.894709587097168, 2.5479636192321777, 3.2012176513671875, 3.8544716835021973, 4.507725715637207, 5.160979747772217, 5.814233779907227, 6.467487812042236, 7.120741844177246, 7.773995876312256, 8.427249908447266, 9.080503463745117, 9.733757972717285, 10.387012481689453, 11.040266036987305, 11.693519592285156, 12.346774101257324, 13.000028610229492, 13.653282165527344, 14.306535720825195, 14.959790229797363, 15.613044738769531, 16.266298294067383, 16.919551849365234, 17.57280731201172, 18.22606086730957, 18.879314422607422]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 10.0, 13.0, 19.0, 21.0, 31.0, 46.0, 70.0, 65.0, 116.0, 174.0, 255.0, 359.0, 570.0, 888.0, 1474.0, 2514.0, 4841.0, 11158.0, 35015.0, 376870.0, 3685841.0, 47475.0, 13480.0, 5474.0, 2863.0, 1647.0, 967.0, 666.0, 410.0, 275.0, 206.0, 119.0, 93.0, 65.0, 34.0, 32.0, 22.0, 25.0, 19.0, 13.0, 6.0, 6.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.3046875, -4.16168212890625, -4.0186767578125, -3.87567138671875, -3.732666015625, -3.58966064453125, -3.4466552734375, -3.30364990234375, -3.16064453125, -3.01763916015625, -2.8746337890625, -2.73162841796875, -2.588623046875, -2.44561767578125, -2.3026123046875, -2.15960693359375, -2.0166015625, -1.87359619140625, -1.7305908203125, -1.58758544921875, -1.444580078125, -1.30157470703125, -1.1585693359375, -1.01556396484375, -0.87255859375, -0.72955322265625, -0.5865478515625, -0.44354248046875, -0.300537109375, -0.15753173828125, -0.0145263671875, 0.12847900390625, 0.271484375, 0.41448974609375, 0.5574951171875, 0.70050048828125, 0.843505859375, 0.98651123046875, 1.1295166015625, 1.27252197265625, 1.41552734375, 1.55853271484375, 1.7015380859375, 1.84454345703125, 1.987548828125, 2.13055419921875, 2.2735595703125, 2.41656494140625, 2.5595703125, 2.70257568359375, 2.8455810546875, 2.98858642578125, 3.131591796875, 3.27459716796875, 3.4176025390625, 3.56060791015625, 3.70361328125, 3.84661865234375, 3.9896240234375, 4.13262939453125, 4.275634765625, 4.41864013671875, 4.5616455078125, 4.70465087890625, 4.84765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 8.0, 4.0, 12.0, 8.0, 10.0, 15.0, 16.0, 32.0, 40.0, 41.0, 44.0, 56.0, 60.0, 56.0, 72.0, 76.0, 89.0, 57.0, 61.0, 47.0, 50.0, 39.0, 21.0, 27.0, 15.0, 13.0, 9.0, 13.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.642578125, -1.5931549072265625, -1.543731689453125, -1.4943084716796875, -1.44488525390625, -1.3954620361328125, -1.346038818359375, -1.2966156005859375, -1.2471923828125, -1.1977691650390625, -1.148345947265625, -1.0989227294921875, -1.04949951171875, -1.0000762939453125, -0.950653076171875, -0.9012298583984375, -0.851806640625, -0.8023834228515625, -0.752960205078125, -0.7035369873046875, -0.65411376953125, -0.6046905517578125, -0.555267333984375, -0.5058441162109375, -0.4564208984375, -0.4069976806640625, -0.357574462890625, -0.3081512451171875, -0.25872802734375, -0.2093048095703125, -0.159881591796875, -0.1104583740234375, -0.06103515625, -0.0116119384765625, 0.037811279296875, 0.0872344970703125, 0.13665771484375, 0.1860809326171875, 0.235504150390625, 0.2849273681640625, 0.3343505859375, 0.3837738037109375, 0.433197021484375, 0.4826202392578125, 0.53204345703125, 0.5814666748046875, 0.630889892578125, 0.6803131103515625, 0.729736328125, 0.7791595458984375, 0.828582763671875, 0.8780059814453125, 0.92742919921875, 0.9768524169921875, 1.026275634765625, 1.0756988525390625, 1.1251220703125, 1.1745452880859375, 1.223968505859375, 1.2733917236328125, 1.32281494140625, 1.3722381591796875, 1.421661376953125, 1.4710845947265625, 1.5205078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 9.0, 11.0, 17.0, 23.0, 28.0, 30.0, 56.0, 72.0, 98.0, 142.0, 199.0, 319.0, 470.0, 728.0, 1223.0, 2029.0, 3717.0, 6797.0, 14681.0, 39620.0, 237176.0, 3743246.0, 94353.0, 25854.0, 10536.0, 5365.0, 2865.0, 1650.0, 1025.0, 628.0, 421.0, 251.0, 189.0, 132.0, 80.0, 54.0, 40.0, 27.0, 30.0, 14.0, 11.0, 13.0, 12.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.318359375, -3.21234130859375, -3.1063232421875, -3.00030517578125, -2.894287109375, -2.78826904296875, -2.6822509765625, -2.57623291015625, -2.47021484375, -2.36419677734375, -2.2581787109375, -2.15216064453125, -2.046142578125, -1.94012451171875, -1.8341064453125, -1.72808837890625, -1.6220703125, -1.51605224609375, -1.4100341796875, -1.30401611328125, -1.197998046875, -1.09197998046875, -0.9859619140625, -0.87994384765625, -0.77392578125, -0.66790771484375, -0.5618896484375, -0.45587158203125, -0.349853515625, -0.24383544921875, -0.1378173828125, -0.03179931640625, 0.07421875, 0.18023681640625, 0.2862548828125, 0.39227294921875, 0.498291015625, 0.60430908203125, 0.7103271484375, 0.81634521484375, 0.92236328125, 1.02838134765625, 1.1343994140625, 1.24041748046875, 1.346435546875, 1.45245361328125, 1.5584716796875, 1.66448974609375, 1.7705078125, 1.87652587890625, 1.9825439453125, 2.08856201171875, 2.194580078125, 2.30059814453125, 2.4066162109375, 2.51263427734375, 2.61865234375, 2.72467041015625, 2.8306884765625, 2.93670654296875, 3.042724609375, 3.14874267578125, 3.2547607421875, 3.36077880859375, 3.466796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 7.0, 3.0, 9.0, 9.0, 14.0, 15.0, 26.0, 28.0, 56.0, 94.0, 248.0, 2852.0, 360.0, 144.0, 59.0, 29.0, 25.0, 21.0, 10.0, 13.0, 11.0, 8.0, 7.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6748046875, -1.62347412109375, -1.5721435546875, -1.52081298828125, -1.469482421875, -1.41815185546875, -1.3668212890625, -1.31549072265625, -1.26416015625, -1.21282958984375, -1.1614990234375, -1.11016845703125, -1.058837890625, -1.00750732421875, -0.9561767578125, -0.90484619140625, -0.853515625, -0.80218505859375, -0.7508544921875, -0.69952392578125, -0.648193359375, -0.59686279296875, -0.5455322265625, -0.49420166015625, -0.44287109375, -0.39154052734375, -0.3402099609375, -0.28887939453125, -0.237548828125, -0.18621826171875, -0.1348876953125, -0.08355712890625, -0.0322265625, 0.01910400390625, 0.0704345703125, 0.12176513671875, 0.173095703125, 0.22442626953125, 0.2757568359375, 0.32708740234375, 0.37841796875, 0.42974853515625, 0.4810791015625, 0.53240966796875, 0.583740234375, 0.63507080078125, 0.6864013671875, 0.73773193359375, 0.7890625, 0.84039306640625, 0.8917236328125, 0.94305419921875, 0.994384765625, 1.04571533203125, 1.0970458984375, 1.14837646484375, 1.19970703125, 1.25103759765625, 1.3023681640625, 1.35369873046875, 1.405029296875, 1.45635986328125, 1.5076904296875, 1.55902099609375, 1.6103515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 14.0, 13.0, 22.0, 23.0, 50.0, 53.0, 81.0, 102.0, 98.0, 123.0, 79.0, 68.0, 63.0, 45.0, 47.0, 28.0, 17.0, 13.0, 16.0, 10.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.317131042480469, -6.099594593048096, -5.882058620452881, -5.664522171020508, -5.446985721588135, -5.229449272155762, -5.011913299560547, -4.794376850128174, -4.576840400695801, -4.359303951263428, -4.141767978668213, -3.92423152923584, -3.706695079803467, -3.489158868789673, -3.271622657775879, -3.054086208343506, -2.836549997329712, -2.619013786315918, -2.401477336883545, -2.183941125869751, -1.966404676437378, -1.748868465423584, -1.5313321352005005, -1.313795804977417, -1.0962594747543335, -0.87872314453125, -0.6611868143081665, -0.4436505436897278, -0.2261142134666443, -0.008577942848205566, 0.20895838737487793, 0.4264947175979614, 0.6440310478210449, 0.8615673780441284, 1.079103708267212, 1.2966399192810059, 1.514176368713379, 1.7317125797271729, 1.9492489099502563, 2.16678524017334, 2.384321689605713, 2.601857900619507, 2.81939435005188, 3.036930561065674, 3.254467010498047, 3.472003221511841, 3.6895394325256348, 3.907075881958008, 4.124611854553223, 4.342148303985596, 4.5596842765808105, 4.777220726013184, 4.994757175445557, 5.21229362487793, 5.4298295974731445, 5.647366046905518, 5.864902496337891, 6.082438945770264, 6.2999749183654785, 6.517511367797852, 6.735047817230225, 6.952584266662598, 7.1701202392578125, 7.3876566886901855, 7.605193138122559]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 7.0, 2.0, 5.0, 6.0, 10.0, 11.0, 17.0, 26.0, 15.0, 23.0, 25.0, 33.0, 31.0, 46.0, 42.0, 38.0, 39.0, 46.0, 51.0, 54.0, 39.0, 36.0, 47.0, 43.0, 26.0, 39.0, 37.0, 31.0, 40.0, 20.0, 25.0, 24.0, 14.0, 11.0, 7.0, 8.0, 7.0, 2.0, 8.0, 3.0, 4.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.618462562561035, -4.480080604553223, -4.341698169708252, -4.2033162117004395, -4.064933776855469, -3.9265518188476562, -3.7881698608398438, -3.649787664413452, -3.5114054679870605, -3.373023271560669, -3.2346410751342773, -3.096259117126465, -2.9578769207000732, -2.8194947242736816, -2.681112766265869, -2.5427305698394775, -2.404348373413086, -2.2659661769866943, -2.1275839805603027, -1.9892020225524902, -1.8508198261260986, -1.712437629699707, -1.574055552482605, -1.435673475265503, -1.2972912788391113, -1.1589090824127197, -1.0205270051956177, -0.8821448683738708, -0.743762731552124, -0.6053805947303772, -0.46699845790863037, -0.32861632108688354, -0.19023466110229492, -0.051852524280548096, 0.08652961254119873, 0.22491174936294556, 0.3632938861846924, 0.5016760230064392, 0.640058159828186, 0.7784402966499329, 0.9168224334716797, 1.0552046298980713, 1.1935867071151733, 1.3319687843322754, 1.470350980758667, 1.6087331771850586, 1.7471152544021606, 1.8854973316192627, 2.0238795280456543, 2.162261724472046, 2.3006439208984375, 2.43902587890625, 2.5774080753326416, 2.715790271759033, 2.8541722297668457, 2.9925544261932373, 3.130936622619629, 3.2693188190460205, 3.407701015472412, 3.5460829734802246, 3.684465169906616, 3.822847366333008, 3.9612293243408203, 4.099611759185791, 4.2379937171936035]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 15.0, 20.0, 20.0, 47.0, 58.0, 96.0, 165.0, 360.0, 578.0, 1136.0, 2419.0, 5618.0, 14408.0, 41607.0, 124600.0, 343318.0, 331931.0, 118411.0, 39637.0, 13982.0, 5386.0, 2362.0, 1063.0, 558.0, 274.0, 197.0, 99.0, 52.0, 47.0, 23.0, 16.0, 6.0, 14.0, 5.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.067779541015625, -3.94805908203125, -3.828338623046875, -3.7086181640625, -3.588897705078125, -3.46917724609375, -3.349456787109375, -3.229736328125, -3.110015869140625, -2.99029541015625, -2.870574951171875, -2.7508544921875, -2.631134033203125, -2.51141357421875, -2.391693115234375, -2.27197265625, -2.152252197265625, -2.03253173828125, -1.912811279296875, -1.7930908203125, -1.673370361328125, -1.55364990234375, -1.433929443359375, -1.314208984375, -1.194488525390625, -1.07476806640625, -0.955047607421875, -0.8353271484375, -0.715606689453125, -0.59588623046875, -0.476165771484375, -0.3564453125, -0.236724853515625, -0.11700439453125, 0.002716064453125, 0.1224365234375, 0.242156982421875, 0.36187744140625, 0.481597900390625, 0.601318359375, 0.721038818359375, 0.84075927734375, 0.960479736328125, 1.0802001953125, 1.199920654296875, 1.31964111328125, 1.439361572265625, 1.55908203125, 1.678802490234375, 1.79852294921875, 1.918243408203125, 2.0379638671875, 2.157684326171875, 2.27740478515625, 2.397125244140625, 2.516845703125, 2.636566162109375, 2.75628662109375, 2.876007080078125, 2.9957275390625, 3.115447998046875, 3.23516845703125, 3.354888916015625, 3.474609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 16.0, 14.0, 14.0, 18.0, 31.0, 29.0, 37.0, 59.0, 62.0, 59.0, 74.0, 74.0, 80.0, 63.0, 64.0, 58.0, 52.0, 50.0, 38.0, 22.0, 24.0, 14.0, 16.0, 8.0, 4.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.142578125, -2.0877838134765625, -2.032989501953125, -1.9781951904296875, -1.92340087890625, -1.8686065673828125, -1.813812255859375, -1.7590179443359375, -1.7042236328125, -1.6494293212890625, -1.594635009765625, -1.5398406982421875, -1.48504638671875, -1.4302520751953125, -1.375457763671875, -1.3206634521484375, -1.265869140625, -1.2110748291015625, -1.156280517578125, -1.1014862060546875, -1.04669189453125, -0.9918975830078125, -0.937103271484375, -0.8823089599609375, -0.8275146484375, -0.7727203369140625, -0.717926025390625, -0.6631317138671875, -0.60833740234375, -0.5535430908203125, -0.498748779296875, -0.4439544677734375, -0.38916015625, -0.3343658447265625, -0.279571533203125, -0.2247772216796875, -0.16998291015625, -0.1151885986328125, -0.060394287109375, -0.0055999755859375, 0.0491943359375, 0.1039886474609375, 0.158782958984375, 0.2135772705078125, 0.26837158203125, 0.3231658935546875, 0.377960205078125, 0.4327545166015625, 0.487548828125, 0.5423431396484375, 0.597137451171875, 0.6519317626953125, 0.70672607421875, 0.7615203857421875, 0.816314697265625, 0.8711090087890625, 0.9259033203125, 0.9806976318359375, 1.035491943359375, 1.0902862548828125, 1.14508056640625, 1.1998748779296875, 1.254669189453125, 1.3094635009765625, 1.3642578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 8.0, 22.0, 14.0, 28.0, 32.0, 42.0, 57.0, 81.0, 83.0, 137.0, 193.0, 301.0, 405.0, 596.0, 984.0, 1982.0, 5631.0, 25569.0, 206955.0, 673430.0, 108046.0, 15447.0, 4075.0, 1641.0, 911.0, 526.0, 354.0, 260.0, 161.0, 125.0, 100.0, 79.0, 55.0, 53.0, 41.0, 29.0, 20.0, 13.0, 6.0, 7.0, 5.0, 7.0, 9.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.421875, -5.2371826171875, -5.052490234375, -4.8677978515625, -4.68310546875, -4.4984130859375, -4.313720703125, -4.1290283203125, -3.9443359375, -3.7596435546875, -3.574951171875, -3.3902587890625, -3.20556640625, -3.0208740234375, -2.836181640625, -2.6514892578125, -2.466796875, -2.2821044921875, -2.097412109375, -1.9127197265625, -1.72802734375, -1.5433349609375, -1.358642578125, -1.1739501953125, -0.9892578125, -0.8045654296875, -0.619873046875, -0.4351806640625, -0.25048828125, -0.0657958984375, 0.118896484375, 0.3035888671875, 0.48828125, 0.6729736328125, 0.857666015625, 1.0423583984375, 1.22705078125, 1.4117431640625, 1.596435546875, 1.7811279296875, 1.9658203125, 2.1505126953125, 2.335205078125, 2.5198974609375, 2.70458984375, 2.8892822265625, 3.073974609375, 3.2586669921875, 3.443359375, 3.6280517578125, 3.812744140625, 3.9974365234375, 4.18212890625, 4.3668212890625, 4.551513671875, 4.7362060546875, 4.9208984375, 5.1055908203125, 5.290283203125, 5.4749755859375, 5.65966796875, 5.8443603515625, 6.029052734375, 6.2137451171875, 6.3984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 1.0, 7.0, 2.0, 7.0, 13.0, 5.0, 12.0, 21.0, 31.0, 19.0, 17.0, 19.0, 28.0, 29.0, 47.0, 46.0, 53.0, 37.0, 46.0, 42.0, 34.0, 45.0, 46.0, 35.0, 32.0, 40.0, 34.0, 32.0, 32.0, 27.0, 26.0, 19.0, 19.0, 28.0, 10.0, 11.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-4.921875, -4.77581787109375, -4.6297607421875, -4.48370361328125, -4.337646484375, -4.19158935546875, -4.0455322265625, -3.89947509765625, -3.75341796875, -3.60736083984375, -3.4613037109375, -3.31524658203125, -3.169189453125, -3.02313232421875, -2.8770751953125, -2.73101806640625, -2.5849609375, -2.43890380859375, -2.2928466796875, -2.14678955078125, -2.000732421875, -1.85467529296875, -1.7086181640625, -1.56256103515625, -1.41650390625, -1.27044677734375, -1.1243896484375, -0.97833251953125, -0.832275390625, -0.68621826171875, -0.5401611328125, -0.39410400390625, -0.248046875, -0.10198974609375, 0.0440673828125, 0.19012451171875, 0.336181640625, 0.48223876953125, 0.6282958984375, 0.77435302734375, 0.92041015625, 1.06646728515625, 1.2125244140625, 1.35858154296875, 1.504638671875, 1.65069580078125, 1.7967529296875, 1.94281005859375, 2.0888671875, 2.23492431640625, 2.3809814453125, 2.52703857421875, 2.673095703125, 2.81915283203125, 2.9652099609375, 3.11126708984375, 3.25732421875, 3.40338134765625, 3.5494384765625, 3.69549560546875, 3.841552734375, 3.98760986328125, 4.1336669921875, 4.27972412109375, 4.42578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 12.0, 10.0, 9.0, 18.0, 27.0, 39.0, 44.0, 80.0, 130.0, 167.0, 313.0, 652.0, 1405.0, 3634.0, 12229.0, 62037.0, 472520.0, 421074.0, 56377.0, 11474.0, 3457.0, 1357.0, 644.0, 335.0, 189.0, 101.0, 62.0, 50.0, 28.0, 23.0, 16.0, 18.0, 8.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.2176513671875, -2.156005859375, -2.0943603515625, -2.03271484375, -1.9710693359375, -1.909423828125, -1.8477783203125, -1.7861328125, -1.7244873046875, -1.662841796875, -1.6011962890625, -1.53955078125, -1.4779052734375, -1.416259765625, -1.3546142578125, -1.29296875, -1.2313232421875, -1.169677734375, -1.1080322265625, -1.04638671875, -0.9847412109375, -0.923095703125, -0.8614501953125, -0.7998046875, -0.7381591796875, -0.676513671875, -0.6148681640625, -0.55322265625, -0.4915771484375, -0.429931640625, -0.3682861328125, -0.306640625, -0.2449951171875, -0.183349609375, -0.1217041015625, -0.06005859375, 0.0015869140625, 0.063232421875, 0.1248779296875, 0.1865234375, 0.2481689453125, 0.309814453125, 0.3714599609375, 0.43310546875, 0.4947509765625, 0.556396484375, 0.6180419921875, 0.6796875, 0.7413330078125, 0.802978515625, 0.8646240234375, 0.92626953125, 0.9879150390625, 1.049560546875, 1.1112060546875, 1.1728515625, 1.2344970703125, 1.296142578125, 1.3577880859375, 1.41943359375, 1.4810791015625, 1.542724609375, 1.6043701171875, 1.666015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 9.0, 9.0, 12.0, 13.0, 30.0, 21.0, 32.0, 29.0, 54.0, 54.0, 89.0, 95.0, 134.0, 102.0, 77.0, 69.0, 35.0, 31.0, 32.0, 14.0, 13.0, 8.0, 9.0, 4.0, 1.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003619194030761719, -0.0003490746021270752, -0.0003362298011779785, -0.00032338500022888184, -0.00031054019927978516, -0.0002976953983306885, -0.0002848505973815918, -0.0002720057964324951, -0.00025916099548339844, -0.00024631619453430176, -0.00023347139358520508, -0.0002206265926361084, -0.00020778179168701172, -0.00019493699073791504, -0.00018209218978881836, -0.00016924738883972168, -0.000156402587890625, -0.00014355778694152832, -0.00013071298599243164, -0.00011786818504333496, -0.00010502338409423828, -9.21785831451416e-05, -7.933378219604492e-05, -6.648898124694824e-05, -5.364418029785156e-05, -4.079937934875488e-05, -2.7954578399658203e-05, -1.5109777450561523e-05, -2.2649765014648438e-06, 1.0579824447631836e-05, 2.3424625396728516e-05, 3.6269426345825195e-05, 4.9114227294921875e-05, 6.195902824401855e-05, 7.480382919311523e-05, 8.764863014221191e-05, 0.0001004934310913086, 0.00011333823204040527, 0.00012618303298950195, 0.00013902783393859863, 0.0001518726348876953, 0.000164717435836792, 0.00017756223678588867, 0.00019040703773498535, 0.00020325183868408203, 0.0002160966396331787, 0.0002289414405822754, 0.00024178624153137207, 0.00025463104248046875, 0.00026747584342956543, 0.0002803206443786621, 0.0002931654453277588, 0.00030601024627685547, 0.00031885504722595215, 0.00033169984817504883, 0.0003445446491241455, 0.0003573894500732422, 0.00037023425102233887, 0.00038307905197143555, 0.0003959238529205322, 0.0004087686538696289, 0.0004216134548187256, 0.00043445825576782227, 0.00044730305671691895, 0.0004601478576660156]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 4.0, 7.0, 7.0, 12.0, 22.0, 21.0, 44.0, 62.0, 101.0, 172.0, 284.0, 562.0, 1133.0, 2713.0, 10442.0, 82826.0, 720715.0, 203158.0, 19145.0, 4042.0, 1485.0, 659.0, 404.0, 189.0, 130.0, 70.0, 41.0, 28.0, 30.0, 17.0, 8.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.951171875, -2.872833251953125, -2.79449462890625, -2.716156005859375, -2.6378173828125, -2.559478759765625, -2.48114013671875, -2.402801513671875, -2.324462890625, -2.246124267578125, -2.16778564453125, -2.089447021484375, -2.0111083984375, -1.932769775390625, -1.85443115234375, -1.776092529296875, -1.69775390625, -1.619415283203125, -1.54107666015625, -1.462738037109375, -1.3843994140625, -1.306060791015625, -1.22772216796875, -1.149383544921875, -1.071044921875, -0.992706298828125, -0.91436767578125, -0.836029052734375, -0.7576904296875, -0.679351806640625, -0.60101318359375, -0.522674560546875, -0.4443359375, -0.365997314453125, -0.28765869140625, -0.209320068359375, -0.1309814453125, -0.052642822265625, 0.02569580078125, 0.104034423828125, 0.182373046875, 0.260711669921875, 0.33905029296875, 0.417388916015625, 0.4957275390625, 0.574066162109375, 0.65240478515625, 0.730743408203125, 0.80908203125, 0.887420654296875, 0.96575927734375, 1.044097900390625, 1.1224365234375, 1.200775146484375, 1.27911376953125, 1.357452392578125, 1.435791015625, 1.514129638671875, 1.59246826171875, 1.670806884765625, 1.7491455078125, 1.827484130859375, 1.90582275390625, 1.984161376953125, 2.0625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 10.0, 2.0, 10.0, 4.0, 4.0, 16.0, 12.0, 16.0, 27.0, 23.0, 38.0, 37.0, 48.0, 50.0, 69.0, 63.0, 75.0, 73.0, 71.0, 58.0, 51.0, 47.0, 28.0, 31.0, 21.0, 27.0, 20.0, 12.0, 10.0, 12.0, 12.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.587890625, -1.542510986328125, -1.49713134765625, -1.451751708984375, -1.4063720703125, -1.360992431640625, -1.31561279296875, -1.270233154296875, -1.224853515625, -1.179473876953125, -1.13409423828125, -1.088714599609375, -1.0433349609375, -0.997955322265625, -0.95257568359375, -0.907196044921875, -0.86181640625, -0.816436767578125, -0.77105712890625, -0.725677490234375, -0.6802978515625, -0.634918212890625, -0.58953857421875, -0.544158935546875, -0.498779296875, -0.453399658203125, -0.40802001953125, -0.362640380859375, -0.3172607421875, -0.271881103515625, -0.22650146484375, -0.181121826171875, -0.1357421875, -0.090362548828125, -0.04498291015625, 0.000396728515625, 0.0457763671875, 0.091156005859375, 0.13653564453125, 0.181915283203125, 0.227294921875, 0.272674560546875, 0.31805419921875, 0.363433837890625, 0.4088134765625, 0.454193115234375, 0.49957275390625, 0.544952392578125, 0.59033203125, 0.635711669921875, 0.68109130859375, 0.726470947265625, 0.7718505859375, 0.817230224609375, 0.86260986328125, 0.907989501953125, 0.953369140625, 0.998748779296875, 1.04412841796875, 1.089508056640625, 1.1348876953125, 1.180267333984375, 1.22564697265625, 1.271026611328125, 1.31640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 22.0, 35.0, 76.0, 165.0, 249.0, 227.0, 126.0, 49.0, 24.0, 16.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.57037353515625, -104.38743591308594, -102.20449829101562, -100.02156066894531, -97.838623046875, -95.65568542480469, -93.47274780273438, -91.28980255126953, -89.10686492919922, -86.9239273071289, -84.7409896850586, -82.55805206298828, -80.37511444091797, -78.19216918945312, -76.00923156738281, -73.8262939453125, -71.64335632324219, -69.46041870117188, -67.27748107910156, -65.09454345703125, -62.91160202026367, -60.72866439819336, -58.54572677612305, -56.362789154052734, -54.17985534667969, -51.996917724609375, -49.81398010253906, -47.63104248046875, -45.44810104370117, -43.26516342163086, -41.08222579956055, -38.899288177490234, -36.716346740722656, -34.533409118652344, -32.35047149658203, -30.167531967163086, -27.98459243774414, -25.801654815673828, -23.618717193603516, -21.435779571533203, -19.252840042114258, -17.069902420043945, -14.886962890625, -12.704025268554688, -10.521086692810059, -8.33814811706543, -6.155210494995117, -3.9722719192504883, -1.7893333435058594, 0.39360499382019043, 2.5765433311462402, 4.759481430053711, 6.94242000579834, 9.125358581542969, 11.308296203613281, 13.49123477935791, 15.674173355102539, 17.85711097717285, 20.040050506591797, 22.22298812866211, 24.405925750732422, 26.588865280151367, 28.77180290222168, 30.954742431640625, 33.13768005371094]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 16.0, 17.0, 30.0, 24.0, 31.0, 48.0, 40.0, 59.0, 68.0, 62.0, 49.0, 73.0, 65.0, 62.0, 76.0, 53.0, 48.0, 40.0, 26.0, 26.0, 15.0, 16.0, 13.0, 5.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.112730026245117, -18.176864624023438, -17.24100112915039, -16.30513572692871, -15.369270324707031, -14.433404922485352, -13.497540473937988, -12.561676025390625, -11.625810623168945, -10.689945220947266, -9.754080772399902, -8.818216323852539, -7.882350921630859, -6.946485996246338, -6.010621070861816, -5.074756145477295, -4.138891220092773, -3.203026294708252, -2.2671613693237305, -1.331296443939209, -0.3954315185546875, 0.540433406829834, 1.4762983322143555, 2.412163257598877, 3.3480281829833984, 4.28389310836792, 5.219758033752441, 6.155622959136963, 7.091487884521484, 8.027353286743164, 8.963217735290527, 9.89908218383789, 10.834945678710938, 11.770811080932617, 12.70667552947998, 13.642539978027344, 14.578405380249023, 15.514270782470703, 16.45013427734375, 17.38599967956543, 18.32186508178711, 19.25773048400879, 20.19359588623047, 21.129459381103516, 22.065324783325195, 23.001190185546875, 23.937053680419922, 24.8729190826416, 25.80878448486328, 26.74464988708496, 27.68051528930664, 28.616378784179688, 29.552244186401367, 30.488109588623047, 31.423973083496094, 32.359840393066406, 33.29570388793945, 34.2315673828125, 35.16743469238281, 36.10329818725586, 37.039161682128906, 37.97502899169922, 38.910892486572266, 39.84675979614258, 40.782623291015625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 10.0, 19.0, 28.0, 54.0, 98.0, 208.0, 441.0, 952.0, 2520.0, 7383.0, 26585.0, 141290.0, 3091733.0, 835447.0, 64695.0, 15095.0, 4623.0, 1691.0, 663.0, 326.0, 168.0, 110.0, 54.0, 29.0, 21.0, 16.0, 10.0, 5.0, 9.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.447265625, -2.329620361328125, -2.21197509765625, -2.094329833984375, -1.9766845703125, -1.859039306640625, -1.74139404296875, -1.623748779296875, -1.506103515625, -1.388458251953125, -1.27081298828125, -1.153167724609375, -1.0355224609375, -0.917877197265625, -0.80023193359375, -0.682586669921875, -0.56494140625, -0.447296142578125, -0.32965087890625, -0.212005615234375, -0.0943603515625, 0.023284912109375, 0.14093017578125, 0.258575439453125, 0.376220703125, 0.493865966796875, 0.61151123046875, 0.729156494140625, 0.8468017578125, 0.964447021484375, 1.08209228515625, 1.199737548828125, 1.3173828125, 1.435028076171875, 1.55267333984375, 1.670318603515625, 1.7879638671875, 1.905609130859375, 2.02325439453125, 2.140899658203125, 2.258544921875, 2.376190185546875, 2.49383544921875, 2.611480712890625, 2.7291259765625, 2.846771240234375, 2.96441650390625, 3.082061767578125, 3.19970703125, 3.317352294921875, 3.43499755859375, 3.552642822265625, 3.6702880859375, 3.787933349609375, 3.90557861328125, 4.023223876953125, 4.140869140625, 4.258514404296875, 4.37615966796875, 4.493804931640625, 4.6114501953125, 4.729095458984375, 4.84674072265625, 4.964385986328125, 5.08203125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 13.0, 13.0, 22.0, 32.0, 32.0, 52.0, 72.0, 80.0, 78.0, 102.0, 108.0, 92.0, 74.0, 62.0, 53.0, 44.0, 23.0, 21.0, 8.0, 9.0, 4.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.23602294921875, -1.1673583984375, -1.09869384765625, -1.030029296875, -0.96136474609375, -0.8927001953125, -0.82403564453125, -0.75537109375, -0.68670654296875, -0.6180419921875, -0.54937744140625, -0.480712890625, -0.41204833984375, -0.3433837890625, -0.27471923828125, -0.2060546875, -0.13739013671875, -0.0687255859375, -6.103515625e-05, 0.068603515625, 0.13726806640625, 0.2059326171875, 0.27459716796875, 0.34326171875, 0.41192626953125, 0.4805908203125, 0.54925537109375, 0.617919921875, 0.68658447265625, 0.7552490234375, 0.82391357421875, 0.892578125, 0.96124267578125, 1.0299072265625, 1.09857177734375, 1.167236328125, 1.23590087890625, 1.3045654296875, 1.37322998046875, 1.44189453125, 1.51055908203125, 1.5792236328125, 1.64788818359375, 1.716552734375, 1.78521728515625, 1.8538818359375, 1.92254638671875, 1.9912109375, 2.05987548828125, 2.1285400390625, 2.19720458984375, 2.265869140625, 2.33453369140625, 2.4031982421875, 2.47186279296875, 2.54052734375, 2.60919189453125, 2.6778564453125, 2.74652099609375, 2.815185546875, 2.88385009765625, 2.9525146484375, 3.02117919921875, 3.08984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 9.0, 11.0, 12.0, 14.0, 25.0, 36.0, 79.0, 168.0, 405.0, 1192.0, 3649.0, 13443.0, 63534.0, 911125.0, 3059894.0, 111911.0, 20498.0, 5397.0, 1671.0, 617.0, 277.0, 140.0, 58.0, 41.0, 26.0, 10.0, 6.0, 15.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.625, -4.48114013671875, -4.3372802734375, -4.19342041015625, -4.049560546875, -3.90570068359375, -3.7618408203125, -3.61798095703125, -3.47412109375, -3.33026123046875, -3.1864013671875, -3.04254150390625, -2.898681640625, -2.75482177734375, -2.6109619140625, -2.46710205078125, -2.3232421875, -2.17938232421875, -2.0355224609375, -1.89166259765625, -1.747802734375, -1.60394287109375, -1.4600830078125, -1.31622314453125, -1.17236328125, -1.02850341796875, -0.8846435546875, -0.74078369140625, -0.596923828125, -0.45306396484375, -0.3092041015625, -0.16534423828125, -0.021484375, 0.12237548828125, 0.2662353515625, 0.41009521484375, 0.553955078125, 0.69781494140625, 0.8416748046875, 0.98553466796875, 1.12939453125, 1.27325439453125, 1.4171142578125, 1.56097412109375, 1.704833984375, 1.84869384765625, 1.9925537109375, 2.13641357421875, 2.2802734375, 2.42413330078125, 2.5679931640625, 2.71185302734375, 2.855712890625, 2.99957275390625, 3.1434326171875, 3.28729248046875, 3.43115234375, 3.57501220703125, 3.7188720703125, 3.86273193359375, 4.006591796875, 4.15045166015625, 4.2943115234375, 4.43817138671875, 4.58203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 2.0, 4.0, 6.0, 11.0, 11.0, 17.0, 23.0, 24.0, 42.0, 41.0, 80.0, 113.0, 181.0, 333.0, 731.0, 1085.0, 589.0, 285.0, 185.0, 85.0, 56.0, 48.0, 33.0, 18.0, 14.0, 10.0, 12.0, 7.0, 6.0, 4.0, 2.0, 3.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6328125, -3.5133056640625, -3.393798828125, -3.2742919921875, -3.15478515625, -3.0352783203125, -2.915771484375, -2.7962646484375, -2.6767578125, -2.5572509765625, -2.437744140625, -2.3182373046875, -2.19873046875, -2.0792236328125, -1.959716796875, -1.8402099609375, -1.720703125, -1.6011962890625, -1.481689453125, -1.3621826171875, -1.24267578125, -1.1231689453125, -1.003662109375, -0.8841552734375, -0.7646484375, -0.6451416015625, -0.525634765625, -0.4061279296875, -0.28662109375, -0.1671142578125, -0.047607421875, 0.0718994140625, 0.19140625, 0.3109130859375, 0.430419921875, 0.5499267578125, 0.66943359375, 0.7889404296875, 0.908447265625, 1.0279541015625, 1.1474609375, 1.2669677734375, 1.386474609375, 1.5059814453125, 1.62548828125, 1.7449951171875, 1.864501953125, 1.9840087890625, 2.103515625, 2.2230224609375, 2.342529296875, 2.4620361328125, 2.58154296875, 2.7010498046875, 2.820556640625, 2.9400634765625, 3.0595703125, 3.1790771484375, 3.298583984375, 3.4180908203125, 3.53759765625, 3.6571044921875, 3.776611328125, 3.8961181640625, 4.015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 11.0, 13.0, 25.0, 30.0, 57.0, 87.0, 169.0, 181.0, 161.0, 114.0, 69.0, 38.0, 19.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.05354690551758, -40.87858963012695, -39.70363235473633, -38.5286750793457, -37.35371398925781, -36.17875671386719, -35.00379943847656, -33.82884216308594, -32.65388488769531, -31.478927612304688, -30.303970336914062, -29.129011154174805, -27.95405387878418, -26.779096603393555, -25.604137420654297, -24.429180145263672, -23.254222869873047, -22.079265594482422, -20.904308319091797, -19.72934913635254, -18.554391860961914, -17.37943458557129, -16.20447540283203, -15.029518127441406, -13.854560852050781, -12.679603576660156, -11.504645347595215, -10.329687118530273, -9.154729843139648, -7.979772090911865, -6.804814338684082, -5.629856109619141, -4.45489501953125, -3.279937267303467, -2.1049795150756836, -0.9300217628479004, 0.2449359893798828, 1.419893741607666, 2.594851493835449, 3.7698097229003906, 4.944766998291016, 6.119724750518799, 7.294682502746582, 8.469640731811523, 9.644598007202148, 10.819555282592773, 11.994513511657715, 13.169471740722656, 14.344429016113281, 15.519386291503906, 16.69434356689453, 17.86930274963379, 19.044260025024414, 20.21921730041504, 21.394176483154297, 22.569133758544922, 23.744091033935547, 24.919048309326172, 26.094005584716797, 27.268964767456055, 28.44392204284668, 29.618879318237305, 30.793838500976562, 31.968795776367188, 33.14375305175781]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 8.0, 11.0, 12.0, 20.0, 14.0, 25.0, 35.0, 44.0, 46.0, 36.0, 58.0, 30.0, 44.0, 55.0, 57.0, 59.0, 47.0, 48.0, 53.0, 39.0, 35.0, 41.0, 31.0, 21.0, 25.0, 15.0, 18.0, 17.0, 12.0, 7.0, 8.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.869686126708984, -18.338943481445312, -17.80820083618164, -17.27745819091797, -16.746715545654297, -16.215970993041992, -15.68522834777832, -15.154485702514648, -14.623743057250977, -14.093000411987305, -13.562257766723633, -13.031514167785645, -12.500771522521973, -11.9700288772583, -11.439285278320312, -10.90854263305664, -10.377799987792969, -9.847057342529297, -9.316314697265625, -8.785571098327637, -8.254828453063965, -7.724085807800293, -7.193342685699463, -6.662599563598633, -6.131856918334961, -5.601114273071289, -5.070371150970459, -4.539628028869629, -4.008885383605957, -3.478142499923706, -2.947399616241455, -2.416656732559204, -1.885915756225586, -1.355172872543335, -0.824429988861084, -0.293687105178833, 0.23705577850341797, 0.767798662185669, 1.29854154586792, 1.829284429550171, 2.360027313232422, 2.890770196914673, 3.421513080596924, 3.952255964279175, 4.482998847961426, 5.013741493225098, 5.544484615325928, 6.075227737426758, 6.60597038269043, 7.136713027954102, 7.667456150054932, 8.198199272155762, 8.728941917419434, 9.259684562683105, 9.790428161621094, 10.321170806884766, 10.851913452148438, 11.38265609741211, 11.913398742675781, 12.44414234161377, 12.974884986877441, 13.505627632141113, 14.036371231079102, 14.567113876342773, 15.097856521606445]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 7.0, 17.0, 17.0, 21.0, 36.0, 43.0, 75.0, 86.0, 142.0, 246.0, 345.0, 598.0, 1013.0, 1778.0, 3083.0, 5582.0, 10908.0, 21798.0, 45839.0, 101938.0, 243728.0, 330494.0, 151503.0, 66454.0, 30680.0, 14831.0, 7568.0, 3949.0, 2295.0, 1346.0, 757.0, 490.0, 300.0, 168.0, 128.0, 88.0, 67.0, 35.0, 28.0, 19.0, 23.0, 8.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.483001708984375, -2.40350341796875, -2.324005126953125, -2.2445068359375, -2.165008544921875, -2.08551025390625, -2.006011962890625, -1.926513671875, -1.847015380859375, -1.76751708984375, -1.688018798828125, -1.6085205078125, -1.529022216796875, -1.44952392578125, -1.370025634765625, -1.29052734375, -1.211029052734375, -1.13153076171875, -1.052032470703125, -0.9725341796875, -0.893035888671875, -0.81353759765625, -0.734039306640625, -0.654541015625, -0.575042724609375, -0.49554443359375, -0.416046142578125, -0.3365478515625, -0.257049560546875, -0.17755126953125, -0.098052978515625, -0.0185546875, 0.060943603515625, 0.14044189453125, 0.219940185546875, 0.2994384765625, 0.378936767578125, 0.45843505859375, 0.537933349609375, 0.617431640625, 0.696929931640625, 0.77642822265625, 0.855926513671875, 0.9354248046875, 1.014923095703125, 1.09442138671875, 1.173919677734375, 1.25341796875, 1.332916259765625, 1.41241455078125, 1.491912841796875, 1.5714111328125, 1.650909423828125, 1.73040771484375, 1.809906005859375, 1.889404296875, 1.968902587890625, 2.04840087890625, 2.127899169921875, 2.2073974609375, 2.286895751953125, 2.36639404296875, 2.445892333984375, 2.525390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 9.0, 9.0, 19.0, 23.0, 25.0, 26.0, 30.0, 34.0, 41.0, 48.0, 59.0, 59.0, 64.0, 67.0, 74.0, 41.0, 63.0, 52.0, 38.0, 43.0, 37.0, 34.0, 28.0, 18.0, 20.0, 7.0, 10.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.07696533203125, -1.0299072265625, -0.98284912109375, -0.935791015625, -0.88873291015625, -0.8416748046875, -0.79461669921875, -0.74755859375, -0.70050048828125, -0.6534423828125, -0.60638427734375, -0.559326171875, -0.51226806640625, -0.4652099609375, -0.41815185546875, -0.37109375, -0.32403564453125, -0.2769775390625, -0.22991943359375, -0.182861328125, -0.13580322265625, -0.0887451171875, -0.04168701171875, 0.00537109375, 0.05242919921875, 0.0994873046875, 0.14654541015625, 0.193603515625, 0.24066162109375, 0.2877197265625, 0.33477783203125, 0.3818359375, 0.42889404296875, 0.4759521484375, 0.52301025390625, 0.570068359375, 0.61712646484375, 0.6641845703125, 0.71124267578125, 0.75830078125, 0.80535888671875, 0.8524169921875, 0.89947509765625, 0.946533203125, 0.99359130859375, 1.0406494140625, 1.08770751953125, 1.134765625, 1.18182373046875, 1.2288818359375, 1.27593994140625, 1.322998046875, 1.37005615234375, 1.4171142578125, 1.46417236328125, 1.51123046875, 1.55828857421875, 1.6053466796875, 1.65240478515625, 1.699462890625, 1.74652099609375, 1.7935791015625, 1.84063720703125, 1.8876953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 5.0, 2.0, 10.0, 6.0, 11.0, 9.0, 13.0, 26.0, 23.0, 38.0, 62.0, 68.0, 110.0, 172.0, 264.0, 498.0, 867.0, 1781.0, 5889.0, 40680.0, 736795.0, 237359.0, 17139.0, 3616.0, 1349.0, 629.0, 422.0, 237.0, 149.0, 91.0, 72.0, 45.0, 34.0, 23.0, 18.0, 14.0, 8.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30859375, -7.06341552734375, -6.8182373046875, -6.57305908203125, -6.327880859375, -6.08270263671875, -5.8375244140625, -5.59234619140625, -5.34716796875, -5.10198974609375, -4.8568115234375, -4.61163330078125, -4.366455078125, -4.12127685546875, -3.8760986328125, -3.63092041015625, -3.3857421875, -3.14056396484375, -2.8953857421875, -2.65020751953125, -2.405029296875, -2.15985107421875, -1.9146728515625, -1.66949462890625, -1.42431640625, -1.17913818359375, -0.9339599609375, -0.68878173828125, -0.443603515625, -0.19842529296875, 0.0467529296875, 0.29193115234375, 0.537109375, 0.78228759765625, 1.0274658203125, 1.27264404296875, 1.517822265625, 1.76300048828125, 2.0081787109375, 2.25335693359375, 2.49853515625, 2.74371337890625, 2.9888916015625, 3.23406982421875, 3.479248046875, 3.72442626953125, 3.9696044921875, 4.21478271484375, 4.4599609375, 4.70513916015625, 4.9503173828125, 5.19549560546875, 5.440673828125, 5.68585205078125, 5.9310302734375, 6.17620849609375, 6.42138671875, 6.66656494140625, 6.9117431640625, 7.15692138671875, 7.402099609375, 7.64727783203125, 7.8924560546875, 8.13763427734375, 8.3828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 5.0, 6.0, 14.0, 18.0, 16.0, 21.0, 28.0, 33.0, 33.0, 26.0, 35.0, 30.0, 63.0, 49.0, 57.0, 42.0, 53.0, 55.0, 55.0, 49.0, 50.0, 47.0, 43.0, 29.0, 29.0, 22.0, 14.0, 15.0, 11.0, 10.0, 8.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0], "bins": [-6.80078125, -6.626708984375, -6.45263671875, -6.278564453125, -6.1044921875, -5.930419921875, -5.75634765625, -5.582275390625, -5.408203125, -5.234130859375, -5.06005859375, -4.885986328125, -4.7119140625, -4.537841796875, -4.36376953125, -4.189697265625, -4.015625, -3.841552734375, -3.66748046875, -3.493408203125, -3.3193359375, -3.145263671875, -2.97119140625, -2.797119140625, -2.623046875, -2.448974609375, -2.27490234375, -2.100830078125, -1.9267578125, -1.752685546875, -1.57861328125, -1.404541015625, -1.23046875, -1.056396484375, -0.88232421875, -0.708251953125, -0.5341796875, -0.360107421875, -0.18603515625, -0.011962890625, 0.162109375, 0.336181640625, 0.51025390625, 0.684326171875, 0.8583984375, 1.032470703125, 1.20654296875, 1.380615234375, 1.5546875, 1.728759765625, 1.90283203125, 2.076904296875, 2.2509765625, 2.425048828125, 2.59912109375, 2.773193359375, 2.947265625, 3.121337890625, 3.29541015625, 3.469482421875, 3.6435546875, 3.817626953125, 3.99169921875, 4.165771484375, 4.33984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 9.0, 2.0, 11.0, 15.0, 14.0, 26.0, 40.0, 46.0, 67.0, 103.0, 180.0, 292.0, 613.0, 1479.0, 4719.0, 19698.0, 156823.0, 778738.0, 68643.0, 11734.0, 3034.0, 1084.0, 477.0, 253.0, 127.0, 94.0, 69.0, 37.0, 33.0, 24.0, 19.0, 8.0, 13.0, 8.0, 5.0, 3.0, 2.0, 2.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.943359375, -2.852325439453125, -2.76129150390625, -2.670257568359375, -2.5792236328125, -2.488189697265625, -2.39715576171875, -2.306121826171875, -2.215087890625, -2.124053955078125, -2.03302001953125, -1.941986083984375, -1.8509521484375, -1.759918212890625, -1.66888427734375, -1.577850341796875, -1.48681640625, -1.395782470703125, -1.30474853515625, -1.213714599609375, -1.1226806640625, -1.031646728515625, -0.94061279296875, -0.849578857421875, -0.758544921875, -0.667510986328125, -0.57647705078125, -0.485443115234375, -0.3944091796875, -0.303375244140625, -0.21234130859375, -0.121307373046875, -0.0302734375, 0.060760498046875, 0.15179443359375, 0.242828369140625, 0.3338623046875, 0.424896240234375, 0.51593017578125, 0.606964111328125, 0.697998046875, 0.789031982421875, 0.88006591796875, 0.971099853515625, 1.0621337890625, 1.153167724609375, 1.24420166015625, 1.335235595703125, 1.42626953125, 1.517303466796875, 1.60833740234375, 1.699371337890625, 1.7904052734375, 1.881439208984375, 1.97247314453125, 2.063507080078125, 2.154541015625, 2.245574951171875, 2.33660888671875, 2.427642822265625, 2.5186767578125, 2.609710693359375, 2.70074462890625, 2.791778564453125, 2.8828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 5.0, 6.0, 8.0, 13.0, 15.0, 6.0, 31.0, 34.0, 22.0, 28.0, 41.0, 60.0, 84.0, 139.0, 119.0, 93.0, 59.0, 48.0, 31.0, 23.0, 24.0, 17.0, 16.0, 11.0, 9.0, 12.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003898143768310547, -0.00037755072116851807, -0.00036528706550598145, -0.0003530234098434448, -0.0003407597541809082, -0.0003284960985183716, -0.00031623244285583496, -0.00030396878719329834, -0.0002917051315307617, -0.0002794414758682251, -0.0002671778202056885, -0.00025491416454315186, -0.00024265050888061523, -0.0002303868532180786, -0.000218123197555542, -0.00020585954189300537, -0.00019359588623046875, -0.00018133223056793213, -0.0001690685749053955, -0.0001568049192428589, -0.00014454126358032227, -0.00013227760791778564, -0.00012001395225524902, -0.0001077502965927124, -9.548664093017578e-05, -8.322298526763916e-05, -7.095932960510254e-05, -5.869567394256592e-05, -4.64320182800293e-05, -3.4168362617492676e-05, -2.1904706954956055e-05, -9.641051292419434e-06, 2.6226043701171875e-06, 1.4886260032653809e-05, 2.714991569519043e-05, 3.941357135772705e-05, 5.167722702026367e-05, 6.394088268280029e-05, 7.620453834533691e-05, 8.846819400787354e-05, 0.00010073184967041016, 0.00011299550533294678, 0.0001252591609954834, 0.00013752281665802002, 0.00014978647232055664, 0.00016205012798309326, 0.00017431378364562988, 0.0001865774393081665, 0.00019884109497070312, 0.00021110475063323975, 0.00022336840629577637, 0.000235632061958313, 0.0002478957176208496, 0.00026015937328338623, 0.00027242302894592285, 0.00028468668460845947, 0.0002969503402709961, 0.0003092139959335327, 0.00032147765159606934, 0.00033374130725860596, 0.0003460049629211426, 0.0003582686185836792, 0.0003705322742462158, 0.00038279592990875244, 0.00039505958557128906]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 9.0, 7.0, 20.0, 30.0, 33.0, 66.0, 78.0, 116.0, 198.0, 314.0, 532.0, 999.0, 2264.0, 6353.0, 31036.0, 363829.0, 587868.0, 41781.0, 7665.0, 2570.0, 1180.0, 618.0, 336.0, 211.0, 143.0, 86.0, 62.0, 37.0, 25.0, 23.0, 10.0, 14.0, 9.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.857421875, -2.771026611328125, -2.68463134765625, -2.598236083984375, -2.5118408203125, -2.425445556640625, -2.33905029296875, -2.252655029296875, -2.166259765625, -2.079864501953125, -1.99346923828125, -1.907073974609375, -1.8206787109375, -1.734283447265625, -1.64788818359375, -1.561492919921875, -1.47509765625, -1.388702392578125, -1.30230712890625, -1.215911865234375, -1.1295166015625, -1.043121337890625, -0.95672607421875, -0.870330810546875, -0.783935546875, -0.697540283203125, -0.61114501953125, -0.524749755859375, -0.4383544921875, -0.351959228515625, -0.26556396484375, -0.179168701171875, -0.0927734375, -0.006378173828125, 0.08001708984375, 0.166412353515625, 0.2528076171875, 0.339202880859375, 0.42559814453125, 0.511993408203125, 0.598388671875, 0.684783935546875, 0.77117919921875, 0.857574462890625, 0.9439697265625, 1.030364990234375, 1.11676025390625, 1.203155517578125, 1.28955078125, 1.375946044921875, 1.46234130859375, 1.548736572265625, 1.6351318359375, 1.721527099609375, 1.80792236328125, 1.894317626953125, 1.980712890625, 2.067108154296875, 2.15350341796875, 2.239898681640625, 2.3262939453125, 2.412689208984375, 2.49908447265625, 2.585479736328125, 2.671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 8.0, 8.0, 6.0, 6.0, 12.0, 8.0, 21.0, 21.0, 16.0, 34.0, 41.0, 61.0, 67.0, 62.0, 95.0, 84.0, 62.0, 67.0, 59.0, 52.0, 45.0, 34.0, 19.0, 24.0, 11.0, 20.0, 10.0, 10.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.80078125, -1.7453460693359375, -1.689910888671875, -1.6344757080078125, -1.57904052734375, -1.5236053466796875, -1.468170166015625, -1.4127349853515625, -1.3572998046875, -1.3018646240234375, -1.246429443359375, -1.1909942626953125, -1.13555908203125, -1.0801239013671875, -1.024688720703125, -0.9692535400390625, -0.913818359375, -0.8583831787109375, -0.802947998046875, -0.7475128173828125, -0.69207763671875, -0.6366424560546875, -0.581207275390625, -0.5257720947265625, -0.4703369140625, -0.4149017333984375, -0.359466552734375, -0.3040313720703125, -0.24859619140625, -0.1931610107421875, -0.137725830078125, -0.0822906494140625, -0.02685546875, 0.0285797119140625, 0.084014892578125, 0.1394500732421875, 0.19488525390625, 0.2503204345703125, 0.305755615234375, 0.3611907958984375, 0.4166259765625, 0.4720611572265625, 0.527496337890625, 0.5829315185546875, 0.63836669921875, 0.6938018798828125, 0.749237060546875, 0.8046722412109375, 0.860107421875, 0.9155426025390625, 0.970977783203125, 1.0264129638671875, 1.08184814453125, 1.1372833251953125, 1.192718505859375, 1.2481536865234375, 1.3035888671875, 1.3590240478515625, 1.414459228515625, 1.4698944091796875, 1.52532958984375, 1.5807647705078125, 1.636199951171875, 1.6916351318359375, 1.7470703125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 10.0, 23.0, 47.0, 95.0, 168.0, 197.0, 173.0, 120.0, 78.0, 31.0, 19.0, 10.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.984535217285156, -36.55978775024414, -35.135040283203125, -33.710296630859375, -32.28554916381836, -30.860801696777344, -29.436054229736328, -28.011306762695312, -26.58656120300293, -25.161813735961914, -23.73706817626953, -22.312320709228516, -20.8875732421875, -19.462827682495117, -18.0380802154541, -16.61333465576172, -15.188587188720703, -13.763840675354004, -12.339094161987305, -10.914346694946289, -9.48960018157959, -8.06485366821289, -6.640106201171875, -5.215359687805176, -3.7906131744384766, -2.3658664226531982, -0.9411196708679199, 0.4836273193359375, 1.9083738327026367, 3.333120346069336, 4.757867813110352, 6.182614326477051, 7.607357025146484, 9.032103538513184, 10.456850051879883, 11.881597518920898, 13.306344032287598, 14.731090545654297, 16.155838012695312, 17.580585479736328, 19.00533103942871, 20.430078506469727, 21.85482406616211, 23.279571533203125, 24.70431900024414, 26.129064559936523, 27.55381202697754, 28.978557586669922, 30.403305053710938, 31.828052520751953, 33.25279998779297, 34.67754364013672, 36.102291107177734, 37.52703857421875, 38.951786041259766, 40.37653350830078, 41.80127716064453, 43.22602462768555, 44.65077209472656, 46.07551574707031, 47.50026321411133, 48.925010681152344, 50.34975814819336, 51.774505615234375, 53.19925308227539]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 6.0, 12.0, 14.0, 9.0, 15.0, 9.0, 25.0, 25.0, 27.0, 29.0, 44.0, 33.0, 42.0, 65.0, 61.0, 61.0, 45.0, 54.0, 55.0, 52.0, 37.0, 38.0, 35.0, 29.0, 23.0, 18.0, 15.0, 32.0, 14.0, 12.0, 10.0, 9.0, 11.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.62863540649414, -22.978681564331055, -22.32872772216797, -21.67877197265625, -21.028818130493164, -20.378864288330078, -19.72890853881836, -19.078954696655273, -18.429000854492188, -17.7790470123291, -17.129093170166016, -16.479137420654297, -15.829183578491211, -15.179229736328125, -14.529274940490723, -13.87932014465332, -13.229366302490234, -12.579412460327148, -11.929457664489746, -11.279502868652344, -10.629549026489258, -9.979595184326172, -9.32964038848877, -8.679685592651367, -8.029731750488281, -7.379777431488037, -6.729823112487793, -6.079868793487549, -5.429914474487305, -4.7799601554870605, -4.130005836486816, -3.4800515174865723, -2.830097198486328, -2.180142879486084, -1.5301885604858398, -0.8802342414855957, -0.23027992248535156, 0.4196743965148926, 1.0696287155151367, 1.7195830345153809, 2.369537353515625, 3.019491672515869, 3.6694459915161133, 4.319400310516357, 4.969354629516602, 5.619308948516846, 6.26926326751709, 6.919217586517334, 7.569171905517578, 8.219125747680664, 8.869080543518066, 9.519035339355469, 10.168989181518555, 10.81894302368164, 11.468897819519043, 12.118852615356445, 12.768806457519531, 13.418760299682617, 14.06871509552002, 14.718669891357422, 15.368623733520508, 16.018577575683594, 16.668533325195312, 17.3184871673584, 17.968441009521484]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 8.0, 10.0, 11.0, 19.0, 12.0, 18.0, 26.0, 36.0, 46.0, 65.0, 84.0, 98.0, 165.0, 266.0, 689.0, 3937.0, 115805.0, 4045137.0, 24821.0, 1830.0, 468.0, 209.0, 133.0, 81.0, 68.0, 53.0, 36.0, 42.0, 24.0, 12.0, 20.0, 13.0, 14.0, 13.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.24505615234375, -6.9471435546875, -6.64923095703125, -6.351318359375, -6.05340576171875, -5.7554931640625, -5.45758056640625, -5.15966796875, -4.86175537109375, -4.5638427734375, -4.26593017578125, -3.968017578125, -3.67010498046875, -3.3721923828125, -3.07427978515625, -2.7763671875, -2.47845458984375, -2.1805419921875, -1.88262939453125, -1.584716796875, -1.28680419921875, -0.9888916015625, -0.69097900390625, -0.39306640625, -0.09515380859375, 0.2027587890625, 0.50067138671875, 0.798583984375, 1.09649658203125, 1.3944091796875, 1.69232177734375, 1.990234375, 2.28814697265625, 2.5860595703125, 2.88397216796875, 3.181884765625, 3.47979736328125, 3.7777099609375, 4.07562255859375, 4.37353515625, 4.67144775390625, 4.9693603515625, 5.26727294921875, 5.565185546875, 5.86309814453125, 6.1610107421875, 6.45892333984375, 6.7568359375, 7.05474853515625, 7.3526611328125, 7.65057373046875, 7.948486328125, 8.24639892578125, 8.5443115234375, 8.84222412109375, 9.14013671875, 9.43804931640625, 9.7359619140625, 10.03387451171875, 10.331787109375, 10.62969970703125, 10.9276123046875, 11.22552490234375, 11.5234375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 10.0, 16.0, 21.0, 30.0, 32.0, 36.0, 56.0, 66.0, 70.0, 85.0, 92.0, 79.0, 88.0, 64.0, 58.0, 51.0, 46.0, 35.0, 21.0, 16.0, 14.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.817962646484375, -1.75701904296875, -1.696075439453125, -1.6351318359375, -1.574188232421875, -1.51324462890625, -1.452301025390625, -1.391357421875, -1.330413818359375, -1.26947021484375, -1.208526611328125, -1.1475830078125, -1.086639404296875, -1.02569580078125, -0.964752197265625, -0.90380859375, -0.842864990234375, -0.78192138671875, -0.720977783203125, -0.6600341796875, -0.599090576171875, -0.53814697265625, -0.477203369140625, -0.416259765625, -0.355316162109375, -0.29437255859375, -0.233428955078125, -0.1724853515625, -0.111541748046875, -0.05059814453125, 0.010345458984375, 0.0712890625, 0.132232666015625, 0.19317626953125, 0.254119873046875, 0.3150634765625, 0.376007080078125, 0.43695068359375, 0.497894287109375, 0.558837890625, 0.619781494140625, 0.68072509765625, 0.741668701171875, 0.8026123046875, 0.863555908203125, 0.92449951171875, 0.985443115234375, 1.04638671875, 1.107330322265625, 1.16827392578125, 1.229217529296875, 1.2901611328125, 1.351104736328125, 1.41204833984375, 1.472991943359375, 1.533935546875, 1.594879150390625, 1.65582275390625, 1.716766357421875, 1.7777099609375, 1.838653564453125, 1.89959716796875, 1.960540771484375, 2.021484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 14.0, 19.0, 30.0, 37.0, 71.0, 128.0, 231.0, 421.0, 963.0, 2496.0, 6415.0, 19470.0, 85813.0, 1499115.0, 2435201.0, 109409.0, 22786.0, 7083.0, 2580.0, 1057.0, 455.0, 219.0, 107.0, 68.0, 23.0, 15.0, 18.0, 6.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.782379150390625, -3.65655517578125, -3.530731201171875, -3.4049072265625, -3.279083251953125, -3.15325927734375, -3.027435302734375, -2.901611328125, -2.775787353515625, -2.64996337890625, -2.524139404296875, -2.3983154296875, -2.272491455078125, -2.14666748046875, -2.020843505859375, -1.89501953125, -1.769195556640625, -1.64337158203125, -1.517547607421875, -1.3917236328125, -1.265899658203125, -1.14007568359375, -1.014251708984375, -0.888427734375, -0.762603759765625, -0.63677978515625, -0.510955810546875, -0.3851318359375, -0.259307861328125, -0.13348388671875, -0.007659912109375, 0.1181640625, 0.243988037109375, 0.36981201171875, 0.495635986328125, 0.6214599609375, 0.747283935546875, 0.87310791015625, 0.998931884765625, 1.124755859375, 1.250579833984375, 1.37640380859375, 1.502227783203125, 1.6280517578125, 1.753875732421875, 1.87969970703125, 2.005523681640625, 2.13134765625, 2.257171630859375, 2.38299560546875, 2.508819580078125, 2.6346435546875, 2.760467529296875, 2.88629150390625, 3.012115478515625, 3.137939453125, 3.263763427734375, 3.38958740234375, 3.515411376953125, 3.6412353515625, 3.767059326171875, 3.89288330078125, 4.018707275390625, 4.14453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 15.0, 8.0, 7.0, 13.0, 28.0, 39.0, 37.0, 65.0, 106.0, 180.0, 346.0, 704.0, 1064.0, 631.0, 300.0, 171.0, 105.0, 69.0, 50.0, 30.0, 21.0, 16.0, 18.0, 7.0, 10.0, 5.0, 1.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.44921875, -4.339202880859375, -4.22918701171875, -4.119171142578125, -4.0091552734375, -3.899139404296875, -3.78912353515625, -3.679107666015625, -3.569091796875, -3.459075927734375, -3.34906005859375, -3.239044189453125, -3.1290283203125, -3.019012451171875, -2.90899658203125, -2.798980712890625, -2.68896484375, -2.578948974609375, -2.46893310546875, -2.358917236328125, -2.2489013671875, -2.138885498046875, -2.02886962890625, -1.918853759765625, -1.808837890625, -1.698822021484375, -1.58880615234375, -1.478790283203125, -1.3687744140625, -1.258758544921875, -1.14874267578125, -1.038726806640625, -0.9287109375, -0.818695068359375, -0.70867919921875, -0.598663330078125, -0.4886474609375, -0.378631591796875, -0.26861572265625, -0.158599853515625, -0.048583984375, 0.061431884765625, 0.17144775390625, 0.281463623046875, 0.3914794921875, 0.501495361328125, 0.61151123046875, 0.721527099609375, 0.83154296875, 0.941558837890625, 1.05157470703125, 1.161590576171875, 1.2716064453125, 1.381622314453125, 1.49163818359375, 1.601654052734375, 1.711669921875, 1.821685791015625, 1.93170166015625, 2.041717529296875, 2.1517333984375, 2.261749267578125, 2.37176513671875, 2.481781005859375, 2.591796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 3.0, 14.0, 33.0, 62.0, 105.0, 173.0, 203.0, 169.0, 94.0, 59.0, 31.0, 19.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.61330795288086, -36.37720489501953, -35.14110565185547, -33.90500259399414, -32.66890335083008, -31.43280029296875, -30.196699142456055, -28.96059799194336, -27.724496841430664, -26.48839569091797, -25.252294540405273, -24.016193389892578, -22.78009033203125, -21.543991088867188, -20.30788803100586, -19.071786880493164, -17.83568572998047, -16.599584579467773, -15.363483428955078, -14.127381324768066, -12.891280174255371, -11.655179023742676, -10.419076919555664, -9.182975769042969, -7.946874618530273, -6.710773468017578, -5.474671840667725, -4.238570213317871, -3.002469062805176, -1.7663679122924805, -0.530266284942627, 0.7058353424072266, 1.9419326782226562, 3.1780340671539307, 4.414135456085205, 5.650237083435059, 6.886338233947754, 8.12243938446045, 9.358541488647461, 10.594642639160156, 11.830743789672852, 13.066844940185547, 14.302946090698242, 15.539048194885254, 16.775150299072266, 18.011249542236328, 19.247352600097656, 20.48345375061035, 21.719554901123047, 22.955656051635742, 24.191757202148438, 25.427858352661133, 26.663959503173828, 27.900062561035156, 29.13616371154785, 30.372264862060547, 31.608366012573242, 32.84446716308594, 34.080570220947266, 35.31666946411133, 36.552772521972656, 37.78887176513672, 39.02497482299805, 40.261077880859375, 41.49717712402344]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 15.0, 12.0, 16.0, 14.0, 15.0, 15.0, 16.0, 18.0, 31.0, 32.0, 32.0, 30.0, 43.0, 36.0, 50.0, 50.0, 41.0, 56.0, 38.0, 46.0, 37.0, 41.0, 33.0, 46.0, 29.0, 27.0, 26.0, 21.0, 18.0, 18.0, 14.0, 14.0, 14.0, 9.0, 5.0, 5.0, 4.0, 5.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.32772159576416, -12.853902816772461, -12.380084037780762, -11.906265258789062, -11.43244743347168, -10.95862865447998, -10.484809875488281, -10.010991096496582, -9.537172317504883, -9.063353538513184, -8.589534759521484, -8.115716934204102, -7.641898155212402, -7.168079376220703, -6.694260597229004, -6.220441818237305, -5.746623992919922, -5.272805213928223, -4.798986911773682, -4.325168132781982, -3.8513495922088623, -3.377531051635742, -2.903712272644043, -2.429893732070923, -1.9560751914978027, -1.4822566509246826, -1.008437991142273, -0.5346193313598633, -0.060800790786743164, 0.41301774978637695, 0.8868365287780762, 1.3606550693511963, 1.83447265625, 2.30829119682312, 2.7821097373962402, 3.2559285163879395, 3.7297470569610596, 4.20356559753418, 4.677384376525879, 5.151203155517578, 5.625021457672119, 6.098840236663818, 6.572658538818359, 7.046477317810059, 7.520296096801758, 7.994114398956299, 8.467933654785156, 8.941751480102539, 9.415570259094238, 9.889389038085938, 10.363207817077637, 10.837026596069336, 11.310844421386719, 11.784663200378418, 12.258481979370117, 12.732300758361816, 13.206119537353516, 13.679938316345215, 14.153757095336914, 14.627574920654297, 15.101393699645996, 15.575212478637695, 16.049030303955078, 16.522850036621094, 16.996667861938477]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 9.0, 13.0, 22.0, 21.0, 30.0, 41.0, 63.0, 92.0, 138.0, 211.0, 352.0, 583.0, 926.0, 1595.0, 2833.0, 5261.0, 9863.0, 19293.0, 39702.0, 86029.0, 201748.0, 338135.0, 186943.0, 79315.0, 36309.0, 17959.0, 9447.0, 4895.0, 2789.0, 1501.0, 930.0, 529.0, 327.0, 218.0, 139.0, 99.0, 58.0, 36.0, 24.0, 21.0, 15.0, 14.0, 7.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.318359375, -2.246917724609375, -2.17547607421875, -2.104034423828125, -2.0325927734375, -1.961151123046875, -1.88970947265625, -1.818267822265625, -1.746826171875, -1.675384521484375, -1.60394287109375, -1.532501220703125, -1.4610595703125, -1.389617919921875, -1.31817626953125, -1.246734619140625, -1.17529296875, -1.103851318359375, -1.03240966796875, -0.960968017578125, -0.8895263671875, -0.818084716796875, -0.74664306640625, -0.675201416015625, -0.603759765625, -0.532318115234375, -0.46087646484375, -0.389434814453125, -0.3179931640625, -0.246551513671875, -0.17510986328125, -0.103668212890625, -0.0322265625, 0.039215087890625, 0.11065673828125, 0.182098388671875, 0.2535400390625, 0.324981689453125, 0.39642333984375, 0.467864990234375, 0.539306640625, 0.610748291015625, 0.68218994140625, 0.753631591796875, 0.8250732421875, 0.896514892578125, 0.96795654296875, 1.039398193359375, 1.11083984375, 1.182281494140625, 1.25372314453125, 1.325164794921875, 1.3966064453125, 1.468048095703125, 1.53948974609375, 1.610931396484375, 1.682373046875, 1.753814697265625, 1.82525634765625, 1.896697998046875, 1.9681396484375, 2.039581298828125, 2.11102294921875, 2.182464599609375, 2.25390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 14.0, 19.0, 14.0, 14.0, 36.0, 51.0, 49.0, 57.0, 48.0, 65.0, 67.0, 71.0, 78.0, 67.0, 71.0, 48.0, 51.0, 46.0, 27.0, 34.0, 14.0, 18.0, 14.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.68359375, -1.624908447265625, -1.56622314453125, -1.507537841796875, -1.4488525390625, -1.390167236328125, -1.33148193359375, -1.272796630859375, -1.214111328125, -1.155426025390625, -1.09674072265625, -1.038055419921875, -0.9793701171875, -0.920684814453125, -0.86199951171875, -0.803314208984375, -0.74462890625, -0.685943603515625, -0.62725830078125, -0.568572998046875, -0.5098876953125, -0.451202392578125, -0.39251708984375, -0.333831787109375, -0.275146484375, -0.216461181640625, -0.15777587890625, -0.099090576171875, -0.0404052734375, 0.018280029296875, 0.07696533203125, 0.135650634765625, 0.1943359375, 0.253021240234375, 0.31170654296875, 0.370391845703125, 0.4290771484375, 0.487762451171875, 0.54644775390625, 0.605133056640625, 0.663818359375, 0.722503662109375, 0.78118896484375, 0.839874267578125, 0.8985595703125, 0.957244873046875, 1.01593017578125, 1.074615478515625, 1.13330078125, 1.191986083984375, 1.25067138671875, 1.309356689453125, 1.3680419921875, 1.426727294921875, 1.48541259765625, 1.544097900390625, 1.602783203125, 1.661468505859375, 1.72015380859375, 1.778839111328125, 1.8375244140625, 1.896209716796875, 1.95489501953125, 2.013580322265625, 2.072265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 9.0, 15.0, 16.0, 15.0, 28.0, 37.0, 39.0, 60.0, 124.0, 182.0, 277.0, 529.0, 933.0, 2159.0, 6042.0, 22861.0, 134559.0, 712187.0, 135110.0, 22882.0, 6044.0, 2170.0, 963.0, 493.0, 288.0, 159.0, 104.0, 69.0, 66.0, 33.0, 27.0, 19.0, 8.0, 15.0, 9.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.28125, -5.10223388671875, -4.9232177734375, -4.74420166015625, -4.565185546875, -4.38616943359375, -4.2071533203125, -4.02813720703125, -3.84912109375, -3.67010498046875, -3.4910888671875, -3.31207275390625, -3.133056640625, -2.95404052734375, -2.7750244140625, -2.59600830078125, -2.4169921875, -2.23797607421875, -2.0589599609375, -1.87994384765625, -1.700927734375, -1.52191162109375, -1.3428955078125, -1.16387939453125, -0.98486328125, -0.80584716796875, -0.6268310546875, -0.44781494140625, -0.268798828125, -0.08978271484375, 0.0892333984375, 0.26824951171875, 0.447265625, 0.62628173828125, 0.8052978515625, 0.98431396484375, 1.163330078125, 1.34234619140625, 1.5213623046875, 1.70037841796875, 1.87939453125, 2.05841064453125, 2.2374267578125, 2.41644287109375, 2.595458984375, 2.77447509765625, 2.9534912109375, 3.13250732421875, 3.3115234375, 3.49053955078125, 3.6695556640625, 3.84857177734375, 4.027587890625, 4.20660400390625, 4.3856201171875, 4.56463623046875, 4.74365234375, 4.92266845703125, 5.1016845703125, 5.28070068359375, 5.459716796875, 5.63873291015625, 5.8177490234375, 5.99676513671875, 6.17578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 2.0, 11.0, 12.0, 17.0, 23.0, 31.0, 41.0, 60.0, 70.0, 88.0, 92.0, 95.0, 82.0, 85.0, 71.0, 54.0, 36.0, 46.0, 27.0, 17.0, 14.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.517822265625, -9.20751953125, -8.897216796875, -8.5869140625, -8.276611328125, -7.96630859375, -7.656005859375, -7.345703125, -7.035400390625, -6.72509765625, -6.414794921875, -6.1044921875, -5.794189453125, -5.48388671875, -5.173583984375, -4.86328125, -4.552978515625, -4.24267578125, -3.932373046875, -3.6220703125, -3.311767578125, -3.00146484375, -2.691162109375, -2.380859375, -2.070556640625, -1.76025390625, -1.449951171875, -1.1396484375, -0.829345703125, -0.51904296875, -0.208740234375, 0.1015625, 0.411865234375, 0.72216796875, 1.032470703125, 1.3427734375, 1.653076171875, 1.96337890625, 2.273681640625, 2.583984375, 2.894287109375, 3.20458984375, 3.514892578125, 3.8251953125, 4.135498046875, 4.44580078125, 4.756103515625, 5.06640625, 5.376708984375, 5.68701171875, 5.997314453125, 6.3076171875, 6.617919921875, 6.92822265625, 7.238525390625, 7.548828125, 7.859130859375, 8.16943359375, 8.479736328125, 8.7900390625, 9.100341796875, 9.41064453125, 9.720947265625, 10.03125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 10.0, 15.0, 19.0, 43.0, 86.0, 216.0, 697.0, 3228.0, 46293.0, 953096.0, 40905.0, 2885.0, 615.0, 213.0, 98.0, 47.0, 35.0, 17.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.63092041015625, -4.4337158203125, -4.23651123046875, -4.039306640625, -3.84210205078125, -3.6448974609375, -3.44769287109375, -3.25048828125, -3.05328369140625, -2.8560791015625, -2.65887451171875, -2.461669921875, -2.26446533203125, -2.0672607421875, -1.87005615234375, -1.6728515625, -1.47564697265625, -1.2784423828125, -1.08123779296875, -0.884033203125, -0.68682861328125, -0.4896240234375, -0.29241943359375, -0.09521484375, 0.10198974609375, 0.2991943359375, 0.49639892578125, 0.693603515625, 0.89080810546875, 1.0880126953125, 1.28521728515625, 1.482421875, 1.67962646484375, 1.8768310546875, 2.07403564453125, 2.271240234375, 2.46844482421875, 2.6656494140625, 2.86285400390625, 3.06005859375, 3.25726318359375, 3.4544677734375, 3.65167236328125, 3.848876953125, 4.04608154296875, 4.2432861328125, 4.44049072265625, 4.6376953125, 4.83489990234375, 5.0321044921875, 5.22930908203125, 5.426513671875, 5.62371826171875, 5.8209228515625, 6.01812744140625, 6.21533203125, 6.41253662109375, 6.6097412109375, 6.80694580078125, 7.004150390625, 7.20135498046875, 7.3985595703125, 7.59576416015625, 7.79296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 10.0, 8.0, 14.0, 16.0, 24.0, 35.0, 42.0, 44.0, 61.0, 80.0, 117.0, 102.0, 108.0, 58.0, 38.0, 56.0, 36.0, 26.0, 28.0, 15.0, 14.0, 7.0, 8.0, 7.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00039577484130859375, -0.00038354843854904175, -0.00037132203578948975, -0.00035909563302993774, -0.00034686923027038574, -0.00033464282751083374, -0.00032241642475128174, -0.00031019002199172974, -0.00029796361923217773, -0.00028573721647262573, -0.00027351081371307373, -0.00026128441095352173, -0.0002490580081939697, -0.00023683160543441772, -0.00022460520267486572, -0.00021237879991531372, -0.00020015239715576172, -0.00018792599439620972, -0.00017569959163665771, -0.0001634731888771057, -0.0001512467861175537, -0.0001390203833580017, -0.0001267939805984497, -0.0001145675778388977, -0.0001023411750793457, -9.01147723197937e-05, -7.78883695602417e-05, -6.56619668006897e-05, -5.3435564041137695e-05, -4.120916128158569e-05, -2.898275852203369e-05, -1.675635576248169e-05, -4.5299530029296875e-06, 7.696449756622314e-06, 1.9922852516174316e-05, 3.214925527572632e-05, 4.437565803527832e-05, 5.660206079483032e-05, 6.882846355438232e-05, 8.105486631393433e-05, 9.328126907348633e-05, 0.00010550767183303833, 0.00011773407459259033, 0.00012996047735214233, 0.00014218688011169434, 0.00015441328287124634, 0.00016663968563079834, 0.00017886608839035034, 0.00019109249114990234, 0.00020331889390945435, 0.00021554529666900635, 0.00022777169942855835, 0.00023999810218811035, 0.00025222450494766235, 0.00026445090770721436, 0.00027667731046676636, 0.00028890371322631836, 0.00030113011598587036, 0.00031335651874542236, 0.00032558292150497437, 0.00033780932426452637, 0.00035003572702407837, 0.00036226212978363037, 0.0003744885325431824, 0.0003867149353027344]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 9.0, 18.0, 21.0, 32.0, 71.0, 152.0, 361.0, 985.0, 3197.0, 21415.0, 761729.0, 246767.0, 10452.0, 2098.0, 680.0, 291.0, 108.0, 65.0, 41.0, 16.0, 13.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.68359375, -5.54095458984375, -5.3983154296875, -5.25567626953125, -5.113037109375, -4.97039794921875, -4.8277587890625, -4.68511962890625, -4.54248046875, -4.39984130859375, -4.2572021484375, -4.11456298828125, -3.971923828125, -3.82928466796875, -3.6866455078125, -3.54400634765625, -3.4013671875, -3.25872802734375, -3.1160888671875, -2.97344970703125, -2.830810546875, -2.68817138671875, -2.5455322265625, -2.40289306640625, -2.26025390625, -2.11761474609375, -1.9749755859375, -1.83233642578125, -1.689697265625, -1.54705810546875, -1.4044189453125, -1.26177978515625, -1.119140625, -0.97650146484375, -0.8338623046875, -0.69122314453125, -0.548583984375, -0.40594482421875, -0.2633056640625, -0.12066650390625, 0.02197265625, 0.16461181640625, 0.3072509765625, 0.44989013671875, 0.592529296875, 0.73516845703125, 0.8778076171875, 1.02044677734375, 1.1630859375, 1.30572509765625, 1.4483642578125, 1.59100341796875, 1.733642578125, 1.87628173828125, 2.0189208984375, 2.16156005859375, 2.30419921875, 2.44683837890625, 2.5894775390625, 2.73211669921875, 2.874755859375, 3.01739501953125, 3.1600341796875, 3.30267333984375, 3.4453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 13.0, 12.0, 14.0, 31.0, 57.0, 53.0, 80.0, 112.0, 117.0, 143.0, 113.0, 65.0, 62.0, 47.0, 30.0, 18.0, 10.0, 3.0, 4.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.087890625, -1.987884521484375, -1.88787841796875, -1.787872314453125, -1.6878662109375, -1.587860107421875, -1.48785400390625, -1.387847900390625, -1.287841796875, -1.187835693359375, -1.08782958984375, -0.987823486328125, -0.8878173828125, -0.787811279296875, -0.68780517578125, -0.587799072265625, -0.48779296875, -0.387786865234375, -0.28778076171875, -0.187774658203125, -0.0877685546875, 0.012237548828125, 0.11224365234375, 0.212249755859375, 0.312255859375, 0.412261962890625, 0.51226806640625, 0.612274169921875, 0.7122802734375, 0.812286376953125, 0.91229248046875, 1.012298583984375, 1.1123046875, 1.212310791015625, 1.31231689453125, 1.412322998046875, 1.5123291015625, 1.612335205078125, 1.71234130859375, 1.812347412109375, 1.912353515625, 2.012359619140625, 2.11236572265625, 2.212371826171875, 2.3123779296875, 2.412384033203125, 2.51239013671875, 2.612396240234375, 2.71240234375, 2.812408447265625, 2.91241455078125, 3.012420654296875, 3.1124267578125, 3.212432861328125, 3.31243896484375, 3.412445068359375, 3.512451171875, 3.612457275390625, 3.71246337890625, 3.812469482421875, 3.9124755859375, 4.012481689453125, 4.11248779296875, 4.212493896484375, 4.3125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 9.0, 14.0, 29.0, 47.0, 125.0, 164.0, 190.0, 174.0, 99.0, 68.0, 37.0, 17.0, 10.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.28925323486328, -53.89160919189453, -52.49396514892578, -51.0963249206543, -49.69868087768555, -48.3010368347168, -46.90339660644531, -45.50575256347656, -44.10810852050781, -42.71046447753906, -41.31282043457031, -39.91518020629883, -38.51753616333008, -37.11989212036133, -35.722251892089844, -34.324607849121094, -32.926963806152344, -31.529319763183594, -30.131677627563477, -28.73403549194336, -27.33639144897461, -25.93874740600586, -24.541105270385742, -23.143463134765625, -21.745819091796875, -20.348175048828125, -18.950532913208008, -17.55289077758789, -16.15524673461914, -14.757603645324707, -13.359960556030273, -11.96231746673584, -10.56467056274414, -9.167027473449707, -7.769384384155273, -6.37174129486084, -4.974098205566406, -3.5764551162719727, -2.178812026977539, -0.7811689376831055, 0.6164741516113281, 2.0141172409057617, 3.4117603302001953, 4.809403419494629, 6.2070465087890625, 7.604689598083496, 9.00233268737793, 10.399975776672363, 11.797618865966797, 13.19526195526123, 14.592905044555664, 15.990548133850098, 17.38819122314453, 18.78583526611328, 20.1834774017334, 21.581119537353516, 22.978763580322266, 24.376407623291016, 25.774049758911133, 27.17169189453125, 28.5693359375, 29.96697998046875, 31.364622116088867, 32.762264251708984, 34.159908294677734]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 18.0, 19.0, 41.0, 55.0, 54.0, 82.0, 97.0, 115.0, 133.0, 89.0, 66.0, 70.0, 61.0, 41.0, 22.0, 15.0, 10.0, 12.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.957256317138672, -22.386268615722656, -20.81528091430664, -19.244291305541992, -17.673303604125977, -16.10231590270996, -14.531327247619629, -12.960338592529297, -11.389350891113281, -9.818363189697266, -8.247374534606934, -6.67638635635376, -5.105398178100586, -3.534409999847412, -1.9634218215942383, -0.39243316650390625, 1.1785545349121094, 2.749542713165283, 4.320530891418457, 5.891519069671631, 7.462507247924805, 9.03349494934082, 10.604483604431152, 12.175472259521484, 13.7464599609375, 15.317447662353516, 16.88843536376953, 18.45942497253418, 20.030412673950195, 21.60140037536621, 23.17238998413086, 24.743377685546875, 26.314369201660156, 27.885356903076172, 29.456344604492188, 31.027334213256836, 32.59832000732422, 34.1693115234375, 35.740299224853516, 37.31128692626953, 38.88227462768555, 40.45326232910156, 42.02425003051758, 43.595237731933594, 45.166229248046875, 46.73721694946289, 48.308204650878906, 49.87919235229492, 51.45018005371094, 53.02116775512695, 54.59215545654297, 56.163143157958984, 57.734130859375, 59.30512237548828, 60.8761100769043, 62.44709777832031, 64.01808166503906, 65.58907318115234, 67.1600570678711, 68.73104858398438, 70.30203247070312, 71.8730239868164, 73.44400787353516, 75.01499938964844, 76.58599090576172]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 14.0, 36.0, 83.0, 202.0, 428.0, 905.0, 2563.0, 10956.0, 90508.0, 2741617.0, 1288727.0, 49412.0, 6634.0, 1403.0, 405.0, 148.0, 74.0, 41.0, 28.0, 19.0, 17.0, 16.0, 9.0, 14.0, 5.0, 7.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.12774658203125, -1.9937744140625, -1.85980224609375, -1.725830078125, -1.59185791015625, -1.4578857421875, -1.32391357421875, -1.18994140625, -1.05596923828125, -0.9219970703125, -0.78802490234375, -0.654052734375, -0.52008056640625, -0.3861083984375, -0.25213623046875, -0.1181640625, 0.01580810546875, 0.1497802734375, 0.28375244140625, 0.417724609375, 0.55169677734375, 0.6856689453125, 0.81964111328125, 0.95361328125, 1.08758544921875, 1.2215576171875, 1.35552978515625, 1.489501953125, 1.62347412109375, 1.7574462890625, 1.89141845703125, 2.025390625, 2.15936279296875, 2.2933349609375, 2.42730712890625, 2.561279296875, 2.69525146484375, 2.8292236328125, 2.96319580078125, 3.09716796875, 3.23114013671875, 3.3651123046875, 3.49908447265625, 3.633056640625, 3.76702880859375, 3.9010009765625, 4.03497314453125, 4.1689453125, 4.30291748046875, 4.4368896484375, 4.57086181640625, 4.704833984375, 4.83880615234375, 4.9727783203125, 5.10675048828125, 5.24072265625, 5.37469482421875, 5.5086669921875, 5.64263916015625, 5.776611328125, 5.91058349609375, 6.0445556640625, 6.17852783203125, 6.3125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 11.0, 24.0, 49.0, 122.0, 191.0, 228.0, 186.0, 107.0, 59.0, 30.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.4132080078125, -1.248291015625, -1.0833740234375, -0.91845703125, -0.7535400390625, -0.588623046875, -0.4237060546875, -0.2587890625, -0.0938720703125, 0.071044921875, 0.2359619140625, 0.40087890625, 0.5657958984375, 0.730712890625, 0.8956298828125, 1.060546875, 1.2254638671875, 1.390380859375, 1.5552978515625, 1.72021484375, 1.8851318359375, 2.050048828125, 2.2149658203125, 2.3798828125, 2.5447998046875, 2.709716796875, 2.8746337890625, 3.03955078125, 3.2044677734375, 3.369384765625, 3.5343017578125, 3.69921875, 3.8641357421875, 4.029052734375, 4.1939697265625, 4.35888671875, 4.5238037109375, 4.688720703125, 4.8536376953125, 5.0185546875, 5.1834716796875, 5.348388671875, 5.5133056640625, 5.67822265625, 5.8431396484375, 6.008056640625, 6.1729736328125, 6.337890625, 6.5028076171875, 6.667724609375, 6.8326416015625, 6.99755859375, 7.1624755859375, 7.327392578125, 7.4923095703125, 7.6572265625, 7.8221435546875, 7.987060546875, 8.1519775390625, 8.31689453125, 8.4818115234375, 8.646728515625, 8.8116455078125, 8.9765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 4.0, 7.0, 10.0, 13.0, 8.0, 20.0, 40.0, 61.0, 76.0, 151.0, 273.0, 535.0, 1129.0, 2704.0, 7292.0, 24422.0, 117045.0, 1715388.0, 2154533.0, 132468.0, 26125.0, 7246.0, 2619.0, 1061.0, 480.0, 250.0, 150.0, 58.0, 43.0, 20.0, 13.0, 8.0, 9.0, 10.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83203125, -3.70855712890625, -3.5850830078125, -3.46160888671875, -3.338134765625, -3.21466064453125, -3.0911865234375, -2.96771240234375, -2.84423828125, -2.72076416015625, -2.5972900390625, -2.47381591796875, -2.350341796875, -2.22686767578125, -2.1033935546875, -1.97991943359375, -1.8564453125, -1.73297119140625, -1.6094970703125, -1.48602294921875, -1.362548828125, -1.23907470703125, -1.1156005859375, -0.99212646484375, -0.86865234375, -0.74517822265625, -0.6217041015625, -0.49822998046875, -0.374755859375, -0.25128173828125, -0.1278076171875, -0.00433349609375, 0.119140625, 0.24261474609375, 0.3660888671875, 0.48956298828125, 0.613037109375, 0.73651123046875, 0.8599853515625, 0.98345947265625, 1.10693359375, 1.23040771484375, 1.3538818359375, 1.47735595703125, 1.600830078125, 1.72430419921875, 1.8477783203125, 1.97125244140625, 2.0947265625, 2.21820068359375, 2.3416748046875, 2.46514892578125, 2.588623046875, 2.71209716796875, 2.8355712890625, 2.95904541015625, 3.08251953125, 3.20599365234375, 3.3294677734375, 3.45294189453125, 3.576416015625, 3.69989013671875, 3.8233642578125, 3.94683837890625, 4.0703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 7.0, 3.0, 4.0, 11.0, 5.0, 18.0, 22.0, 28.0, 36.0, 42.0, 65.0, 86.0, 111.0, 195.0, 286.0, 529.0, 649.0, 626.0, 472.0, 316.0, 161.0, 100.0, 72.0, 51.0, 45.0, 31.0, 19.0, 20.0, 10.0, 15.0, 7.0, 7.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.1875, -4.07080078125, -3.9541015625, -3.83740234375, -3.720703125, -3.60400390625, -3.4873046875, -3.37060546875, -3.25390625, -3.13720703125, -3.0205078125, -2.90380859375, -2.787109375, -2.67041015625, -2.5537109375, -2.43701171875, -2.3203125, -2.20361328125, -2.0869140625, -1.97021484375, -1.853515625, -1.73681640625, -1.6201171875, -1.50341796875, -1.38671875, -1.27001953125, -1.1533203125, -1.03662109375, -0.919921875, -0.80322265625, -0.6865234375, -0.56982421875, -0.453125, -0.33642578125, -0.2197265625, -0.10302734375, 0.013671875, 0.13037109375, 0.2470703125, 0.36376953125, 0.48046875, 0.59716796875, 0.7138671875, 0.83056640625, 0.947265625, 1.06396484375, 1.1806640625, 1.29736328125, 1.4140625, 1.53076171875, 1.6474609375, 1.76416015625, 1.880859375, 1.99755859375, 2.1142578125, 2.23095703125, 2.34765625, 2.46435546875, 2.5810546875, 2.69775390625, 2.814453125, 2.93115234375, 3.0478515625, 3.16455078125, 3.28125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 10.0, 29.0, 58.0, 119.0, 191.0, 218.0, 169.0, 99.0, 33.0, 26.0, 19.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.176084518432617, -28.619718551635742, -27.063350677490234, -25.50698471069336, -23.950618743896484, -22.39425277709961, -20.837886810302734, -19.281518936157227, -17.72515296936035, -16.168787002563477, -14.612420082092285, -13.056053161621094, -11.499687194824219, -9.943321228027344, -8.386954307556152, -6.830587387084961, -5.274221420288086, -3.7178549766540527, -2.1614885330200195, -0.6051220893859863, 0.9512443542480469, 2.50761079788208, 4.063977241516113, 5.620344161987305, 7.17671012878418, 8.733076095581055, 10.289443016052246, 11.845809936523438, 13.402175903320312, 14.958541870117188, 16.514907836914062, 18.07127571105957, 19.627639770507812, 21.184005737304688, 22.740371704101562, 24.29673957824707, 25.853105545043945, 27.40947151184082, 28.965839385986328, 30.522205352783203, 32.07857131958008, 33.63493728637695, 35.19130325317383, 36.7476692199707, 38.304039001464844, 39.86040496826172, 41.416770935058594, 42.97313690185547, 44.529502868652344, 46.08586883544922, 47.642234802246094, 49.19860076904297, 50.754966735839844, 52.311336517333984, 53.86770248413086, 55.424068450927734, 56.98043441772461, 58.536800384521484, 60.09316635131836, 61.649532318115234, 63.205902099609375, 64.76226806640625, 66.31863403320312, 67.875, 69.43136596679688]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 18.0, 15.0, 9.0, 31.0, 62.0, 85.0, 73.0, 81.0, 98.0, 120.0, 98.0, 82.0, 62.0, 51.0, 33.0, 32.0, 26.0, 13.0, 9.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.40704345703125, -58.18239212036133, -56.95773696899414, -55.73308563232422, -54.50843048095703, -53.28377914428711, -52.05912780761719, -50.83447265625, -49.60982131958008, -48.385169982910156, -47.16051483154297, -45.93586349487305, -44.711212158203125, -43.48655700683594, -42.261905670166016, -41.037254333496094, -39.812599182128906, -38.587947845458984, -37.3632926940918, -36.138641357421875, -34.91398620605469, -33.689334869384766, -32.464683532714844, -31.24003028869629, -30.015377044677734, -28.79072380065918, -27.566070556640625, -26.341419219970703, -25.11676597595215, -23.892112731933594, -22.667461395263672, -21.442808151245117, -20.218154907226562, -18.993501663208008, -17.768848419189453, -16.54419708251953, -15.319543838500977, -14.094890594482422, -12.870238304138184, -11.645586013793945, -10.42093276977539, -9.196279525756836, -7.971627235412598, -6.746974468231201, -5.522321701049805, -4.297668933868408, -3.0730161666870117, -1.8483638763427734, -0.6237106323242188, 0.6009421348571777, 1.8255949020385742, 3.0502476692199707, 4.274900436401367, 5.499553203582764, 6.72420597076416, 7.948858261108398, 9.173511505126953, 10.398164749145508, 11.622817039489746, 12.847469329833984, 14.072122573852539, 15.296775817871094, 16.521427154541016, 17.74608039855957, 18.970733642578125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 8.0, 2.0, 5.0, 9.0, 8.0, 7.0, 9.0, 17.0, 17.0, 28.0, 46.0, 63.0, 90.0, 151.0, 204.0, 309.0, 515.0, 907.0, 1552.0, 2668.0, 4886.0, 8990.0, 17493.0, 34446.0, 67147.0, 132680.0, 267296.0, 253364.0, 124332.0, 63291.0, 32009.0, 16725.0, 8484.0, 4651.0, 2456.0, 1440.0, 829.0, 521.0, 291.0, 187.0, 129.0, 89.0, 69.0, 42.0, 27.0, 22.0, 16.0, 10.0, 11.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.171875, -2.099365234375, -2.02685546875, -1.954345703125, -1.8818359375, -1.809326171875, -1.73681640625, -1.664306640625, -1.591796875, -1.519287109375, -1.44677734375, -1.374267578125, -1.3017578125, -1.229248046875, -1.15673828125, -1.084228515625, -1.01171875, -0.939208984375, -0.86669921875, -0.794189453125, -0.7216796875, -0.649169921875, -0.57666015625, -0.504150390625, -0.431640625, -0.359130859375, -0.28662109375, -0.214111328125, -0.1416015625, -0.069091796875, 0.00341796875, 0.075927734375, 0.1484375, 0.220947265625, 0.29345703125, 0.365966796875, 0.4384765625, 0.510986328125, 0.58349609375, 0.656005859375, 0.728515625, 0.801025390625, 0.87353515625, 0.946044921875, 1.0185546875, 1.091064453125, 1.16357421875, 1.236083984375, 1.30859375, 1.381103515625, 1.45361328125, 1.526123046875, 1.5986328125, 1.671142578125, 1.74365234375, 1.816162109375, 1.888671875, 1.961181640625, 2.03369140625, 2.106201171875, 2.1787109375, 2.251220703125, 2.32373046875, 2.396240234375, 2.46875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 0.0, 9.0, 10.0, 17.0, 21.0, 41.0, 29.0, 47.0, 64.0, 59.0, 89.0, 82.0, 79.0, 77.0, 71.0, 63.0, 56.0, 43.0, 41.0, 26.0, 22.0, 17.0, 14.0, 10.0, 9.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2392578125, -1.1761322021484375, -1.113006591796875, -1.0498809814453125, -0.98675537109375, -0.9236297607421875, -0.860504150390625, -0.7973785400390625, -0.7342529296875, -0.6711273193359375, -0.608001708984375, -0.5448760986328125, -0.48175048828125, -0.4186248779296875, -0.355499267578125, -0.2923736572265625, -0.229248046875, -0.1661224365234375, -0.102996826171875, -0.0398712158203125, 0.02325439453125, 0.0863800048828125, 0.149505615234375, 0.2126312255859375, 0.2757568359375, 0.3388824462890625, 0.402008056640625, 0.4651336669921875, 0.52825927734375, 0.5913848876953125, 0.654510498046875, 0.7176361083984375, 0.78076171875, 0.8438873291015625, 0.907012939453125, 0.9701385498046875, 1.03326416015625, 1.0963897705078125, 1.159515380859375, 1.2226409912109375, 1.2857666015625, 1.3488922119140625, 1.412017822265625, 1.4751434326171875, 1.53826904296875, 1.6013946533203125, 1.664520263671875, 1.7276458740234375, 1.790771484375, 1.8538970947265625, 1.917022705078125, 1.9801483154296875, 2.04327392578125, 2.1063995361328125, 2.169525146484375, 2.2326507568359375, 2.2957763671875, 2.3589019775390625, 2.422027587890625, 2.4851531982421875, 2.54827880859375, 2.6114044189453125, 2.674530029296875, 2.7376556396484375, 2.80078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 3.0, 12.0, 17.0, 12.0, 21.0, 28.0, 64.0, 76.0, 124.0, 198.0, 324.0, 561.0, 1118.0, 2509.0, 7675.0, 57183.0, 818396.0, 140742.0, 13009.0, 3276.0, 1379.0, 733.0, 404.0, 226.0, 155.0, 102.0, 56.0, 43.0, 26.0, 12.0, 15.0, 10.0, 11.0, 5.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.453125, -9.154541015625, -8.85595703125, -8.557373046875, -8.2587890625, -7.960205078125, -7.66162109375, -7.363037109375, -7.064453125, -6.765869140625, -6.46728515625, -6.168701171875, -5.8701171875, -5.571533203125, -5.27294921875, -4.974365234375, -4.67578125, -4.377197265625, -4.07861328125, -3.780029296875, -3.4814453125, -3.182861328125, -2.88427734375, -2.585693359375, -2.287109375, -1.988525390625, -1.68994140625, -1.391357421875, -1.0927734375, -0.794189453125, -0.49560546875, -0.197021484375, 0.1015625, 0.400146484375, 0.69873046875, 0.997314453125, 1.2958984375, 1.594482421875, 1.89306640625, 2.191650390625, 2.490234375, 2.788818359375, 3.08740234375, 3.385986328125, 3.6845703125, 3.983154296875, 4.28173828125, 4.580322265625, 4.87890625, 5.177490234375, 5.47607421875, 5.774658203125, 6.0732421875, 6.371826171875, 6.67041015625, 6.968994140625, 7.267578125, 7.566162109375, 7.86474609375, 8.163330078125, 8.4619140625, 8.760498046875, 9.05908203125, 9.357666015625, 9.65625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 15.0, 5.0, 7.0, 17.0, 17.0, 20.0, 33.0, 28.0, 30.0, 35.0, 33.0, 50.0, 53.0, 57.0, 63.0, 48.0, 62.0, 45.0, 56.0, 48.0, 30.0, 29.0, 24.0, 37.0, 16.0, 33.0, 26.0, 16.0, 13.0, 7.0, 7.0, 5.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.9921875, -5.78424072265625, -5.5762939453125, -5.36834716796875, -5.160400390625, -4.95245361328125, -4.7445068359375, -4.53656005859375, -4.32861328125, -4.12066650390625, -3.9127197265625, -3.70477294921875, -3.496826171875, -3.28887939453125, -3.0809326171875, -2.87298583984375, -2.6650390625, -2.45709228515625, -2.2491455078125, -2.04119873046875, -1.833251953125, -1.62530517578125, -1.4173583984375, -1.20941162109375, -1.00146484375, -0.79351806640625, -0.5855712890625, -0.37762451171875, -0.169677734375, 0.03826904296875, 0.2462158203125, 0.45416259765625, 0.662109375, 0.87005615234375, 1.0780029296875, 1.28594970703125, 1.493896484375, 1.70184326171875, 1.9097900390625, 2.11773681640625, 2.32568359375, 2.53363037109375, 2.7415771484375, 2.94952392578125, 3.157470703125, 3.36541748046875, 3.5733642578125, 3.78131103515625, 3.9892578125, 4.19720458984375, 4.4051513671875, 4.61309814453125, 4.821044921875, 5.02899169921875, 5.2369384765625, 5.44488525390625, 5.65283203125, 5.86077880859375, 6.0687255859375, 6.27667236328125, 6.484619140625, 6.69256591796875, 6.9005126953125, 7.10845947265625, 7.31640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 15.0, 25.0, 31.0, 61.0, 95.0, 169.0, 329.0, 778.0, 2400.0, 10309.0, 77471.0, 801129.0, 135358.0, 15317.0, 3211.0, 992.0, 386.0, 159.0, 94.0, 71.0, 48.0, 24.0, 12.0, 18.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.6484375, -3.545989990234375, -3.44354248046875, -3.341094970703125, -3.2386474609375, -3.136199951171875, -3.03375244140625, -2.931304931640625, -2.828857421875, -2.726409912109375, -2.62396240234375, -2.521514892578125, -2.4190673828125, -2.316619873046875, -2.21417236328125, -2.111724853515625, -2.00927734375, -1.906829833984375, -1.80438232421875, -1.701934814453125, -1.5994873046875, -1.497039794921875, -1.39459228515625, -1.292144775390625, -1.189697265625, -1.087249755859375, -0.98480224609375, -0.882354736328125, -0.7799072265625, -0.677459716796875, -0.57501220703125, -0.472564697265625, -0.3701171875, -0.267669677734375, -0.16522216796875, -0.062774658203125, 0.0396728515625, 0.142120361328125, 0.24456787109375, 0.347015380859375, 0.449462890625, 0.551910400390625, 0.65435791015625, 0.756805419921875, 0.8592529296875, 0.961700439453125, 1.06414794921875, 1.166595458984375, 1.26904296875, 1.371490478515625, 1.47393798828125, 1.576385498046875, 1.6788330078125, 1.781280517578125, 1.88372802734375, 1.986175537109375, 2.088623046875, 2.191070556640625, 2.29351806640625, 2.395965576171875, 2.4984130859375, 2.600860595703125, 2.70330810546875, 2.805755615234375, 2.908203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 0.0, 5.0, 5.0, 10.0, 9.0, 10.0, 17.0, 17.0, 34.0, 34.0, 48.0, 73.0, 116.0, 195.0, 131.0, 75.0, 61.0, 39.0, 30.0, 24.0, 10.0, 15.0, 13.0, 7.0, 4.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005507469177246094, -0.0005264952778816223, -0.0005022436380386353, -0.0004779919981956482, -0.00045374035835266113, -0.00042948871850967407, -0.000405237078666687, -0.00038098543882369995, -0.0003567337989807129, -0.00033248215913772583, -0.00030823051929473877, -0.0002839788794517517, -0.00025972723960876465, -0.0002354755997657776, -0.00021122395992279053, -0.00018697232007980347, -0.0001627206802368164, -0.00013846904039382935, -0.00011421740055084229, -8.996576070785522e-05, -6.571412086486816e-05, -4.1462481021881104e-05, -1.7210841178894043e-05, 7.040798664093018e-06, 3.129243850708008e-05, 5.554407835006714e-05, 7.97957181930542e-05, 0.00010404735803604126, 0.00012829899787902832, 0.00015255063772201538, 0.00017680227756500244, 0.0002010539174079895, 0.00022530555725097656, 0.0002495571970939636, 0.0002738088369369507, 0.00029806047677993774, 0.0003223121166229248, 0.00034656375646591187, 0.0003708153963088989, 0.000395067036151886, 0.00041931867599487305, 0.0004435703158378601, 0.00046782195568084717, 0.0004920735955238342, 0.0005163252353668213, 0.0005405768752098083, 0.0005648285150527954, 0.0005890801548957825, 0.0006133317947387695, 0.0006375834345817566, 0.0006618350744247437, 0.0006860867142677307, 0.0007103383541107178, 0.0007345899939537048, 0.0007588416337966919, 0.000783093273639679, 0.000807344913482666, 0.0008315965533256531, 0.0008558481931686401, 0.0008800998330116272, 0.0009043514728546143, 0.0009286031126976013, 0.0009528547525405884, 0.0009771063923835754, 0.0010013580322265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 9.0, 17.0, 10.0, 16.0, 27.0, 29.0, 63.0, 72.0, 98.0, 151.0, 277.0, 450.0, 792.0, 1504.0, 3631.0, 11446.0, 56941.0, 604594.0, 315233.0, 38350.0, 8615.0, 2926.0, 1436.0, 721.0, 414.0, 237.0, 151.0, 111.0, 75.0, 40.0, 23.0, 26.0, 25.0, 13.0, 9.0, 4.0, 7.0, 8.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.01171875, -1.944427490234375, -1.87713623046875, -1.809844970703125, -1.7425537109375, -1.675262451171875, -1.60797119140625, -1.540679931640625, -1.473388671875, -1.406097412109375, -1.33880615234375, -1.271514892578125, -1.2042236328125, -1.136932373046875, -1.06964111328125, -1.002349853515625, -0.93505859375, -0.867767333984375, -0.80047607421875, -0.733184814453125, -0.6658935546875, -0.598602294921875, -0.53131103515625, -0.464019775390625, -0.396728515625, -0.329437255859375, -0.26214599609375, -0.194854736328125, -0.1275634765625, -0.060272216796875, 0.00701904296875, 0.074310302734375, 0.1416015625, 0.208892822265625, 0.27618408203125, 0.343475341796875, 0.4107666015625, 0.478057861328125, 0.54534912109375, 0.612640380859375, 0.679931640625, 0.747222900390625, 0.81451416015625, 0.881805419921875, 0.9490966796875, 1.016387939453125, 1.08367919921875, 1.150970458984375, 1.21826171875, 1.285552978515625, 1.35284423828125, 1.420135498046875, 1.4874267578125, 1.554718017578125, 1.62200927734375, 1.689300537109375, 1.756591796875, 1.823883056640625, 1.89117431640625, 1.958465576171875, 2.0257568359375, 2.093048095703125, 2.16033935546875, 2.227630615234375, 2.294921875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 3.0, 6.0, 10.0, 4.0, 5.0, 11.0, 7.0, 11.0, 25.0, 22.0, 21.0, 31.0, 38.0, 38.0, 48.0, 64.0, 64.0, 87.0, 83.0, 68.0, 54.0, 47.0, 47.0, 34.0, 30.0, 33.0, 20.0, 14.0, 22.0, 12.0, 5.0, 7.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.794921875, -1.7417755126953125, -1.688629150390625, -1.6354827880859375, -1.58233642578125, -1.5291900634765625, -1.476043701171875, -1.4228973388671875, -1.3697509765625, -1.3166046142578125, -1.263458251953125, -1.2103118896484375, -1.15716552734375, -1.1040191650390625, -1.050872802734375, -0.9977264404296875, -0.944580078125, -0.8914337158203125, -0.838287353515625, -0.7851409912109375, -0.73199462890625, -0.6788482666015625, -0.625701904296875, -0.5725555419921875, -0.5194091796875, -0.4662628173828125, -0.413116455078125, -0.3599700927734375, -0.30682373046875, -0.2536773681640625, -0.200531005859375, -0.1473846435546875, -0.09423828125, -0.0410919189453125, 0.012054443359375, 0.0652008056640625, 0.11834716796875, 0.1714935302734375, 0.224639892578125, 0.2777862548828125, 0.3309326171875, 0.3840789794921875, 0.437225341796875, 0.4903717041015625, 0.54351806640625, 0.5966644287109375, 0.649810791015625, 0.7029571533203125, 0.756103515625, 0.8092498779296875, 0.862396240234375, 0.9155426025390625, 0.96868896484375, 1.0218353271484375, 1.074981689453125, 1.1281280517578125, 1.1812744140625, 1.2344207763671875, 1.287567138671875, 1.3407135009765625, 1.39385986328125, 1.4470062255859375, 1.500152587890625, 1.5532989501953125, 1.6064453125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 10.0, 12.0, 19.0, 34.0, 54.0, 104.0, 156.0, 215.0, 116.0, 102.0, 67.0, 39.0, 23.0, 14.0, 9.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.8177604675293, -38.551513671875, -37.28527069091797, -36.01902389526367, -34.752777099609375, -33.48653030395508, -32.22028350830078, -30.95404052734375, -29.687793731689453, -28.421546936035156, -27.155302047729492, -25.889057159423828, -24.62281036376953, -23.356563568115234, -22.09031867980957, -20.824073791503906, -19.55782699584961, -18.291580200195312, -17.02533531188965, -15.759089469909668, -14.492843627929688, -13.226597785949707, -11.960351943969727, -10.694106101989746, -9.427860260009766, -8.161614418029785, -6.895368576049805, -5.629122734069824, -4.362876892089844, -3.0966310501098633, -1.8303852081298828, -0.5641393661499023, 0.7021064758300781, 1.9683523178100586, 3.234598159790039, 4.5008440017700195, 5.76708984375, 7.0333356857299805, 8.299581527709961, 9.565827369689941, 10.832073211669922, 12.098319053649902, 13.364564895629883, 14.630810737609863, 15.897056579589844, 17.16330337524414, 18.429548263549805, 19.69579315185547, 20.962039947509766, 22.228286743164062, 23.494531631469727, 24.76077651977539, 26.027023315429688, 27.293270111083984, 28.55951499938965, 29.825759887695312, 31.09200668334961, 32.358253479003906, 33.62449645996094, 34.890743255615234, 36.15699005126953, 37.42323684692383, 38.689483642578125, 39.955726623535156, 41.22197341918945]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 0.0, 4.0, 5.0, 8.0, 4.0, 9.0, 10.0, 12.0, 18.0, 33.0, 26.0, 27.0, 31.0, 19.0, 36.0, 45.0, 45.0, 54.0, 64.0, 79.0, 75.0, 51.0, 38.0, 32.0, 31.0, 28.0, 35.0, 20.0, 25.0, 19.0, 17.0, 21.0, 16.0, 8.0, 15.0, 10.0, 9.0, 7.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.91098403930664, -24.229276657104492, -23.54756736755371, -22.865859985351562, -22.184152603149414, -21.502445220947266, -20.820735931396484, -20.139028549194336, -19.457321166992188, -18.77561378479004, -18.093904495239258, -17.41219711303711, -16.73048973083496, -16.048782348632812, -15.367073059082031, -14.685365676879883, -14.003656387329102, -13.321948051452637, -12.640240669250488, -11.958532333374023, -11.276824951171875, -10.59511661529541, -9.913408279418945, -9.231700897216797, -8.549992561340332, -7.868284702301025, -7.186576843261719, -6.504868507385254, -5.823160648345947, -5.141452789306641, -4.459744453430176, -3.778036594390869, -3.0963287353515625, -2.414620876312256, -1.7329127788543701, -1.0512046813964844, -0.36949682235717773, 0.3122110366821289, 0.9939193725585938, 1.6756272315979004, 2.357335090637207, 3.0390429496765137, 3.7207510471343994, 4.402459144592285, 5.084167003631592, 5.765874862670898, 6.447583198547363, 7.12929105758667, 7.810998916625977, 8.492707252502441, 9.17441463470459, 9.856122970581055, 10.537830352783203, 11.219538688659668, 11.901247024536133, 12.582954406738281, 13.264662742614746, 13.946371078491211, 14.62807846069336, 15.309786796569824, 15.991495132446289, 16.673202514648438, 17.35491180419922, 18.036619186401367, 18.718326568603516]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 8.0, 13.0, 20.0, 27.0, 36.0, 59.0, 112.0, 187.0, 344.0, 738.0, 1382.0, 3240.0, 8173.0, 25567.0, 110115.0, 1360104.0, 2449023.0, 181455.0, 35077.0, 10896.0, 4155.0, 1739.0, 784.0, 402.0, 248.0, 142.0, 95.0, 42.0, 33.0, 18.0, 11.0, 11.0, 5.0, 7.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6875, -2.598297119140625, -2.50909423828125, -2.419891357421875, -2.3306884765625, -2.241485595703125, -2.15228271484375, -2.063079833984375, -1.973876953125, -1.884674072265625, -1.79547119140625, -1.706268310546875, -1.6170654296875, -1.527862548828125, -1.43865966796875, -1.349456787109375, -1.26025390625, -1.171051025390625, -1.08184814453125, -0.992645263671875, -0.9034423828125, -0.814239501953125, -0.72503662109375, -0.635833740234375, -0.546630859375, -0.457427978515625, -0.36822509765625, -0.279022216796875, -0.1898193359375, -0.100616455078125, -0.01141357421875, 0.077789306640625, 0.1669921875, 0.256195068359375, 0.34539794921875, 0.434600830078125, 0.5238037109375, 0.613006591796875, 0.70220947265625, 0.791412353515625, 0.880615234375, 0.969818115234375, 1.05902099609375, 1.148223876953125, 1.2374267578125, 1.326629638671875, 1.41583251953125, 1.505035400390625, 1.59423828125, 1.683441162109375, 1.77264404296875, 1.861846923828125, 1.9510498046875, 2.040252685546875, 2.12945556640625, 2.218658447265625, 2.307861328125, 2.397064208984375, 2.48626708984375, 2.575469970703125, 2.6646728515625, 2.753875732421875, 2.84307861328125, 2.932281494140625, 3.021484375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 2.0, 2.0, 9.0, 8.0, 8.0, 11.0, 16.0, 12.0, 26.0, 17.0, 20.0, 29.0, 33.0, 35.0, 36.0, 30.0, 63.0, 55.0, 50.0, 49.0, 38.0, 54.0, 52.0, 39.0, 39.0, 43.0, 32.0, 24.0, 21.0, 22.0, 21.0, 23.0, 18.0, 18.0, 9.0, 7.0, 8.0, 9.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.3623046875, -1.32452392578125, -1.2867431640625, -1.24896240234375, -1.211181640625, -1.17340087890625, -1.1356201171875, -1.09783935546875, -1.06005859375, -1.02227783203125, -0.9844970703125, -0.94671630859375, -0.908935546875, -0.87115478515625, -0.8333740234375, -0.79559326171875, -0.7578125, -0.72003173828125, -0.6822509765625, -0.64447021484375, -0.606689453125, -0.56890869140625, -0.5311279296875, -0.49334716796875, -0.45556640625, -0.41778564453125, -0.3800048828125, -0.34222412109375, -0.304443359375, -0.26666259765625, -0.2288818359375, -0.19110107421875, -0.1533203125, -0.11553955078125, -0.0777587890625, -0.03997802734375, -0.002197265625, 0.03558349609375, 0.0733642578125, 0.11114501953125, 0.14892578125, 0.18670654296875, 0.2244873046875, 0.26226806640625, 0.300048828125, 0.33782958984375, 0.3756103515625, 0.41339111328125, 0.451171875, 0.48895263671875, 0.5267333984375, 0.56451416015625, 0.602294921875, 0.64007568359375, 0.6778564453125, 0.71563720703125, 0.75341796875, 0.79119873046875, 0.8289794921875, 0.86676025390625, 0.904541015625, 0.94232177734375, 0.9801025390625, 1.01788330078125, 1.0556640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 9.0, 5.0, 6.0, 12.0, 24.0, 30.0, 48.0, 68.0, 111.0, 159.0, 324.0, 509.0, 914.0, 1872.0, 4030.0, 10436.0, 35257.0, 198550.0, 3127794.0, 713243.0, 71070.0, 17906.0, 6097.0, 2658.0, 1320.0, 707.0, 417.0, 237.0, 167.0, 94.0, 49.0, 49.0, 27.0, 23.0, 13.0, 11.0, 9.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.36328125, -4.22998046875, -4.0966796875, -3.96337890625, -3.830078125, -3.69677734375, -3.5634765625, -3.43017578125, -3.296875, -3.16357421875, -3.0302734375, -2.89697265625, -2.763671875, -2.63037109375, -2.4970703125, -2.36376953125, -2.23046875, -2.09716796875, -1.9638671875, -1.83056640625, -1.697265625, -1.56396484375, -1.4306640625, -1.29736328125, -1.1640625, -1.03076171875, -0.8974609375, -0.76416015625, -0.630859375, -0.49755859375, -0.3642578125, -0.23095703125, -0.09765625, 0.03564453125, 0.1689453125, 0.30224609375, 0.435546875, 0.56884765625, 0.7021484375, 0.83544921875, 0.96875, 1.10205078125, 1.2353515625, 1.36865234375, 1.501953125, 1.63525390625, 1.7685546875, 1.90185546875, 2.03515625, 2.16845703125, 2.3017578125, 2.43505859375, 2.568359375, 2.70166015625, 2.8349609375, 2.96826171875, 3.1015625, 3.23486328125, 3.3681640625, 3.50146484375, 3.634765625, 3.76806640625, 3.9013671875, 4.03466796875, 4.16796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 3.0, 11.0, 13.0, 19.0, 38.0, 36.0, 72.0, 117.0, 174.0, 368.0, 843.0, 1070.0, 583.0, 277.0, 156.0, 83.0, 68.0, 37.0, 37.0, 15.0, 6.0, 8.0, 5.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.65142822265625, -4.4747314453125, -4.29803466796875, -4.121337890625, -3.94464111328125, -3.7679443359375, -3.59124755859375, -3.41455078125, -3.23785400390625, -3.0611572265625, -2.88446044921875, -2.707763671875, -2.53106689453125, -2.3543701171875, -2.17767333984375, -2.0009765625, -1.82427978515625, -1.6475830078125, -1.47088623046875, -1.294189453125, -1.11749267578125, -0.9407958984375, -0.76409912109375, -0.58740234375, -0.41070556640625, -0.2340087890625, -0.05731201171875, 0.119384765625, 0.29608154296875, 0.4727783203125, 0.64947509765625, 0.826171875, 1.00286865234375, 1.1795654296875, 1.35626220703125, 1.532958984375, 1.70965576171875, 1.8863525390625, 2.06304931640625, 2.23974609375, 2.41644287109375, 2.5931396484375, 2.76983642578125, 2.946533203125, 3.12322998046875, 3.2999267578125, 3.47662353515625, 3.6533203125, 3.83001708984375, 4.0067138671875, 4.18341064453125, 4.360107421875, 4.53680419921875, 4.7135009765625, 4.89019775390625, 5.06689453125, 5.24359130859375, 5.4202880859375, 5.59698486328125, 5.773681640625, 5.95037841796875, 6.1270751953125, 6.30377197265625, 6.48046875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 13.0, 30.0, 61.0, 149.0, 238.0, 231.0, 140.0, 80.0, 20.0, 12.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.4642448425293, -61.53456497192383, -59.60488510131836, -57.67520523071289, -55.74552536010742, -53.81584930419922, -51.88616943359375, -49.95648956298828, -48.02680969238281, -46.097129821777344, -44.167449951171875, -42.237770080566406, -40.30809020996094, -38.37841033935547, -36.44873046875, -34.5190544128418, -32.58937072753906, -30.659690856933594, -28.730010986328125, -26.800331115722656, -24.87065315246582, -22.94097328186035, -21.011293411254883, -19.081615447998047, -17.151935577392578, -15.22225570678711, -13.292576789855957, -11.362896919250488, -9.433218002319336, -7.503538131713867, -5.573858261108398, -3.644179344177246, -1.7145004272460938, 0.21517908573150635, 2.1448585987091064, 4.074538230895996, 6.004217624664307, 7.933897018432617, 9.863576889038086, 11.793255805969238, 13.722935676574707, 15.652615547180176, 17.582294464111328, 19.511974334716797, 21.441654205322266, 23.371334075927734, 25.301013946533203, 27.23069190979004, 29.160371780395508, 31.090051651000977, 33.01972961425781, 34.94940948486328, 36.87908935546875, 38.80876922607422, 40.73844909667969, 42.668128967285156, 44.597808837890625, 46.527488708496094, 48.45716857910156, 50.38684844970703, 52.3165283203125, 54.24620819091797, 56.17588806152344, 58.10556411743164, 60.03524398803711]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 2.0, 10.0, 3.0, 7.0, 7.0, 10.0, 9.0, 12.0, 13.0, 22.0, 18.0, 16.0, 32.0, 33.0, 35.0, 34.0, 42.0, 36.0, 51.0, 48.0, 50.0, 44.0, 56.0, 46.0, 61.0, 33.0, 31.0, 31.0, 27.0, 31.0, 29.0, 20.0, 16.0, 19.0, 15.0, 11.0, 7.0, 7.0, 6.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.495256423950195, -19.847238540649414, -19.19921875, -18.55120086669922, -17.903182983398438, -17.255165100097656, -16.607147216796875, -15.959127426147461, -15.31110954284668, -14.663091659545898, -14.0150728225708, -13.367053985595703, -12.719036102294922, -12.07101821899414, -11.422999382019043, -10.774980545043945, -10.126962661743164, -9.478944778442383, -8.830925941467285, -8.182907104492188, -7.534889221191406, -6.886870861053467, -6.238852500915527, -5.590834140777588, -4.942815780639648, -4.294797420501709, -3.6467790603637695, -2.99876070022583, -2.3507423400878906, -1.7027239799499512, -1.0547056198120117, -0.40668725967407227, 0.24132919311523438, 0.8893475532531738, 1.5373659133911133, 2.1853842735290527, 2.833402633666992, 3.4814209938049316, 4.129439353942871, 4.7774577140808105, 5.42547607421875, 6.0734944343566895, 6.721512794494629, 7.369531154632568, 8.017549514770508, 8.665567398071289, 9.313586235046387, 9.961605072021484, 10.609622955322266, 11.257640838623047, 11.905659675598145, 12.553678512573242, 13.201696395874023, 13.849714279174805, 14.497733116149902, 15.145751953125, 15.793769836425781, 16.441787719726562, 17.089805603027344, 17.737825393676758, 18.38584327697754, 19.03386116027832, 19.681880950927734, 20.329898834228516, 20.977916717529297]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 6.0, 9.0, 11.0, 23.0, 33.0, 63.0, 73.0, 95.0, 140.0, 202.0, 291.0, 449.0, 630.0, 998.0, 1438.0, 2317.0, 3583.0, 5820.0, 9613.0, 16837.0, 30694.0, 58959.0, 124264.0, 257275.0, 265974.0, 130507.0, 61716.0, 32126.0, 17558.0, 9977.0, 6131.0, 3784.0, 2382.0, 1514.0, 988.0, 689.0, 411.0, 288.0, 240.0, 125.0, 98.0, 70.0, 52.0, 22.0, 29.0, 10.0, 9.0, 8.0, 4.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1015625, -2.033843994140625, -1.96612548828125, -1.898406982421875, -1.8306884765625, -1.762969970703125, -1.69525146484375, -1.627532958984375, -1.559814453125, -1.492095947265625, -1.42437744140625, -1.356658935546875, -1.2889404296875, -1.221221923828125, -1.15350341796875, -1.085784912109375, -1.01806640625, -0.950347900390625, -0.88262939453125, -0.814910888671875, -0.7471923828125, -0.679473876953125, -0.61175537109375, -0.544036865234375, -0.476318359375, -0.408599853515625, -0.34088134765625, -0.273162841796875, -0.2054443359375, -0.137725830078125, -0.07000732421875, -0.002288818359375, 0.0654296875, 0.133148193359375, 0.20086669921875, 0.268585205078125, 0.3363037109375, 0.404022216796875, 0.47174072265625, 0.539459228515625, 0.607177734375, 0.674896240234375, 0.74261474609375, 0.810333251953125, 0.8780517578125, 0.945770263671875, 1.01348876953125, 1.081207275390625, 1.14892578125, 1.216644287109375, 1.28436279296875, 1.352081298828125, 1.4197998046875, 1.487518310546875, 1.55523681640625, 1.622955322265625, 1.690673828125, 1.758392333984375, 1.82611083984375, 1.893829345703125, 1.9615478515625, 2.029266357421875, 2.09698486328125, 2.164703369140625, 2.232421875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 12.0, 5.0, 12.0, 19.0, 14.0, 29.0, 38.0, 30.0, 41.0, 40.0, 37.0, 45.0, 55.0, 40.0, 43.0, 44.0, 64.0, 39.0, 41.0, 47.0, 27.0, 41.0, 39.0, 34.0, 31.0, 27.0, 15.0, 17.0, 13.0, 4.0, 7.0, 13.0, 6.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.32379150390625, -1.2774658203125, -1.23114013671875, -1.184814453125, -1.13848876953125, -1.0921630859375, -1.04583740234375, -0.99951171875, -0.95318603515625, -0.9068603515625, -0.86053466796875, -0.814208984375, -0.76788330078125, -0.7215576171875, -0.67523193359375, -0.62890625, -0.58258056640625, -0.5362548828125, -0.48992919921875, -0.443603515625, -0.39727783203125, -0.3509521484375, -0.30462646484375, -0.25830078125, -0.21197509765625, -0.1656494140625, -0.11932373046875, -0.072998046875, -0.02667236328125, 0.0196533203125, 0.06597900390625, 0.1123046875, 0.15863037109375, 0.2049560546875, 0.25128173828125, 0.297607421875, 0.34393310546875, 0.3902587890625, 0.43658447265625, 0.48291015625, 0.52923583984375, 0.5755615234375, 0.62188720703125, 0.668212890625, 0.71453857421875, 0.7608642578125, 0.80718994140625, 0.853515625, 0.89984130859375, 0.9461669921875, 0.99249267578125, 1.038818359375, 1.08514404296875, 1.1314697265625, 1.17779541015625, 1.22412109375, 1.27044677734375, 1.3167724609375, 1.36309814453125, 1.409423828125, 1.45574951171875, 1.5020751953125, 1.54840087890625, 1.5947265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 9.0, 9.0, 22.0, 33.0, 45.0, 72.0, 112.0, 173.0, 360.0, 671.0, 1563.0, 5792.0, 62851.0, 914679.0, 53893.0, 5252.0, 1580.0, 620.0, 317.0, 193.0, 104.0, 73.0, 40.0, 35.0, 17.0, 13.0, 7.0, 5.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5234375, -10.1259765625, -9.728515625, -9.3310546875, -8.93359375, -8.5361328125, -8.138671875, -7.7412109375, -7.34375, -6.9462890625, -6.548828125, -6.1513671875, -5.75390625, -5.3564453125, -4.958984375, -4.5615234375, -4.1640625, -3.7666015625, -3.369140625, -2.9716796875, -2.57421875, -2.1767578125, -1.779296875, -1.3818359375, -0.984375, -0.5869140625, -0.189453125, 0.2080078125, 0.60546875, 1.0029296875, 1.400390625, 1.7978515625, 2.1953125, 2.5927734375, 2.990234375, 3.3876953125, 3.78515625, 4.1826171875, 4.580078125, 4.9775390625, 5.375, 5.7724609375, 6.169921875, 6.5673828125, 6.96484375, 7.3623046875, 7.759765625, 8.1572265625, 8.5546875, 8.9521484375, 9.349609375, 9.7470703125, 10.14453125, 10.5419921875, 10.939453125, 11.3369140625, 11.734375, 12.1318359375, 12.529296875, 12.9267578125, 13.32421875, 13.7216796875, 14.119140625, 14.5166015625, 14.9140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 5.0, 7.0, 19.0, 11.0, 24.0, 24.0, 30.0, 41.0, 52.0, 37.0, 41.0, 59.0, 59.0, 76.0, 50.0, 69.0, 62.0, 53.0, 47.0, 40.0, 43.0, 30.0, 23.0, 19.0, 12.0, 13.0, 11.0, 6.0, 6.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5390625, -7.288330078125, -7.03759765625, -6.786865234375, -6.5361328125, -6.285400390625, -6.03466796875, -5.783935546875, -5.533203125, -5.282470703125, -5.03173828125, -4.781005859375, -4.5302734375, -4.279541015625, -4.02880859375, -3.778076171875, -3.52734375, -3.276611328125, -3.02587890625, -2.775146484375, -2.5244140625, -2.273681640625, -2.02294921875, -1.772216796875, -1.521484375, -1.270751953125, -1.02001953125, -0.769287109375, -0.5185546875, -0.267822265625, -0.01708984375, 0.233642578125, 0.484375, 0.735107421875, 0.98583984375, 1.236572265625, 1.4873046875, 1.738037109375, 1.98876953125, 2.239501953125, 2.490234375, 2.740966796875, 2.99169921875, 3.242431640625, 3.4931640625, 3.743896484375, 3.99462890625, 4.245361328125, 4.49609375, 4.746826171875, 4.99755859375, 5.248291015625, 5.4990234375, 5.749755859375, 6.00048828125, 6.251220703125, 6.501953125, 6.752685546875, 7.00341796875, 7.254150390625, 7.5048828125, 7.755615234375, 8.00634765625, 8.257080078125, 8.5078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 9.0, 18.0, 26.0, 26.0, 48.0, 63.0, 116.0, 196.0, 345.0, 720.0, 2066.0, 7382.0, 38355.0, 443391.0, 506033.0, 38573.0, 7610.0, 2034.0, 707.0, 324.0, 183.0, 101.0, 61.0, 55.0, 27.0, 23.0, 19.0, 12.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.0357666015625, -1.954345703125, -1.8729248046875, -1.79150390625, -1.7100830078125, -1.628662109375, -1.5472412109375, -1.4658203125, -1.3843994140625, -1.302978515625, -1.2215576171875, -1.14013671875, -1.0587158203125, -0.977294921875, -0.8958740234375, -0.814453125, -0.7330322265625, -0.651611328125, -0.5701904296875, -0.48876953125, -0.4073486328125, -0.325927734375, -0.2445068359375, -0.1630859375, -0.0816650390625, -0.000244140625, 0.0811767578125, 0.16259765625, 0.2440185546875, 0.325439453125, 0.4068603515625, 0.48828125, 0.5697021484375, 0.651123046875, 0.7325439453125, 0.81396484375, 0.8953857421875, 0.976806640625, 1.0582275390625, 1.1396484375, 1.2210693359375, 1.302490234375, 1.3839111328125, 1.46533203125, 1.5467529296875, 1.628173828125, 1.7095947265625, 1.791015625, 1.8724365234375, 1.953857421875, 2.0352783203125, 2.11669921875, 2.1981201171875, 2.279541015625, 2.3609619140625, 2.4423828125, 2.5238037109375, 2.605224609375, 2.6866455078125, 2.76806640625, 2.8494873046875, 2.930908203125, 3.0123291015625, 3.09375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 9.0, 11.0, 5.0, 16.0, 16.0, 21.0, 26.0, 31.0, 51.0, 76.0, 95.0, 133.0, 135.0, 96.0, 68.0, 36.0, 33.0, 31.0, 26.0, 22.0, 9.0, 10.0, 6.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005865097045898438, -0.0005697011947631836, -0.0005528926849365234, -0.0005360841751098633, -0.0005192756652832031, -0.000502467155456543, -0.0004856586456298828, -0.00046885013580322266, -0.0004520416259765625, -0.00043523311614990234, -0.0004184246063232422, -0.00040161609649658203, -0.0003848075866699219, -0.0003679990768432617, -0.00035119056701660156, -0.0003343820571899414, -0.00031757354736328125, -0.0003007650375366211, -0.00028395652770996094, -0.0002671480178833008, -0.0002503395080566406, -0.00023353099822998047, -0.0002167224884033203, -0.00019991397857666016, -0.00018310546875, -0.00016629695892333984, -0.0001494884490966797, -0.00013267993927001953, -0.00011587142944335938, -9.906291961669922e-05, -8.225440979003906e-05, -6.54458999633789e-05, -4.863739013671875e-05, -3.1828880310058594e-05, -1.5020370483398438e-05, 1.7881393432617188e-06, 1.8596649169921875e-05, 3.540515899658203e-05, 5.221366882324219e-05, 6.902217864990234e-05, 8.58306884765625e-05, 0.00010263919830322266, 0.00011944770812988281, 0.00013625621795654297, 0.00015306472778320312, 0.00016987323760986328, 0.00018668174743652344, 0.0002034902572631836, 0.00022029876708984375, 0.0002371072769165039, 0.00025391578674316406, 0.0002707242965698242, 0.0002875328063964844, 0.00030434131622314453, 0.0003211498260498047, 0.00033795833587646484, 0.000354766845703125, 0.00037157535552978516, 0.0003883838653564453, 0.00040519237518310547, 0.0004220008850097656, 0.0004388093948364258, 0.00045561790466308594, 0.0004724264144897461, 0.0004892349243164062]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 3.0, 5.0, 4.0, 14.0, 21.0, 41.0, 70.0, 113.0, 219.0, 462.0, 862.0, 2000.0, 5930.0, 30061.0, 579680.0, 393079.0, 26675.0, 5615.0, 1972.0, 814.0, 394.0, 226.0, 112.0, 66.0, 43.0, 14.0, 15.0, 14.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.33477783203125, -2.2593994140625, -2.18402099609375, -2.108642578125, -2.03326416015625, -1.9578857421875, -1.88250732421875, -1.80712890625, -1.73175048828125, -1.6563720703125, -1.58099365234375, -1.505615234375, -1.43023681640625, -1.3548583984375, -1.27947998046875, -1.2041015625, -1.12872314453125, -1.0533447265625, -0.97796630859375, -0.902587890625, -0.82720947265625, -0.7518310546875, -0.67645263671875, -0.60107421875, -0.52569580078125, -0.4503173828125, -0.37493896484375, -0.299560546875, -0.22418212890625, -0.1488037109375, -0.07342529296875, 0.001953125, 0.07733154296875, 0.1527099609375, 0.22808837890625, 0.303466796875, 0.37884521484375, 0.4542236328125, 0.52960205078125, 0.60498046875, 0.68035888671875, 0.7557373046875, 0.83111572265625, 0.906494140625, 0.98187255859375, 1.0572509765625, 1.13262939453125, 1.2080078125, 1.28338623046875, 1.3587646484375, 1.43414306640625, 1.509521484375, 1.58489990234375, 1.6602783203125, 1.73565673828125, 1.81103515625, 1.88641357421875, 1.9617919921875, 2.03717041015625, 2.112548828125, 2.18792724609375, 2.2633056640625, 2.33868408203125, 2.4140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 9.0, 6.0, 6.0, 6.0, 14.0, 13.0, 21.0, 17.0, 17.0, 31.0, 40.0, 54.0, 64.0, 74.0, 83.0, 96.0, 73.0, 61.0, 64.0, 47.0, 55.0, 30.0, 21.0, 17.0, 22.0, 17.0, 15.0, 8.0, 9.0, 6.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.8798828125, -1.8346405029296875, -1.789398193359375, -1.7441558837890625, -1.69891357421875, -1.6536712646484375, -1.608428955078125, -1.5631866455078125, -1.5179443359375, -1.4727020263671875, -1.427459716796875, -1.3822174072265625, -1.33697509765625, -1.2917327880859375, -1.246490478515625, -1.2012481689453125, -1.156005859375, -1.1107635498046875, -1.065521240234375, -1.0202789306640625, -0.97503662109375, -0.9297943115234375, -0.884552001953125, -0.8393096923828125, -0.7940673828125, -0.7488250732421875, -0.703582763671875, -0.6583404541015625, -0.61309814453125, -0.5678558349609375, -0.522613525390625, -0.4773712158203125, -0.43212890625, -0.3868865966796875, -0.341644287109375, -0.2964019775390625, -0.25115966796875, -0.2059173583984375, -0.160675048828125, -0.1154327392578125, -0.0701904296875, -0.0249481201171875, 0.020294189453125, 0.0655364990234375, 0.11077880859375, 0.1560211181640625, 0.201263427734375, 0.2465057373046875, 0.291748046875, 0.3369903564453125, 0.382232666015625, 0.4274749755859375, 0.47271728515625, 0.5179595947265625, 0.563201904296875, 0.6084442138671875, 0.6536865234375, 0.6989288330078125, 0.744171142578125, 0.7894134521484375, 0.83465576171875, 0.8798980712890625, 0.925140380859375, 0.9703826904296875, 1.015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 13.0, 20.0, 33.0, 71.0, 84.0, 141.0, 205.0, 156.0, 103.0, 64.0, 32.0, 23.0, 18.0, 6.0, 7.0, 2.0, 3.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.67342758178711, -42.45110321044922, -41.22877502441406, -40.006446838378906, -38.784122467041016, -37.561798095703125, -36.33946990966797, -35.11714172363281, -33.89481735229492, -32.67249298095703, -31.450164794921875, -30.22783851623535, -29.005512237548828, -27.783185958862305, -26.56085968017578, -25.338533401489258, -24.116207122802734, -22.89388084411621, -21.671554565429688, -20.449228286743164, -19.22690200805664, -18.004575729370117, -16.782249450683594, -15.55992317199707, -14.337596893310547, -13.115270614624023, -11.8929443359375, -10.670618057250977, -9.448291778564453, -8.22596549987793, -7.003639221191406, -5.781312942504883, -4.558990478515625, -3.3366641998291016, -2.114337921142578, -0.8920116424560547, 0.33031463623046875, 1.5526409149169922, 2.7749671936035156, 3.997293472290039, 5.2196197509765625, 6.441946029663086, 7.664272308349609, 8.886598587036133, 10.108924865722656, 11.33125114440918, 12.553577423095703, 13.775903701782227, 14.99822998046875, 16.220556259155273, 17.442882537841797, 18.66520881652832, 19.887535095214844, 21.109861373901367, 22.33218765258789, 23.554513931274414, 24.776840209960938, 25.99916648864746, 27.221492767333984, 28.443819046020508, 29.66614532470703, 30.888471603393555, 32.11079788208008, 33.33312225341797, 34.555450439453125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 5.0, 9.0, 7.0, 9.0, 9.0, 10.0, 14.0, 6.0, 24.0, 22.0, 19.0, 19.0, 15.0, 16.0, 37.0, 20.0, 36.0, 38.0, 41.0, 52.0, 60.0, 75.0, 70.0, 51.0, 40.0, 36.0, 32.0, 32.0, 26.0, 16.0, 19.0, 27.0, 20.0, 12.0, 11.0, 11.0, 9.0, 9.0, 8.0, 6.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-26.3154239654541, -25.593761444091797, -24.872098922729492, -24.150436401367188, -23.42877197265625, -22.707109451293945, -21.98544692993164, -21.263784408569336, -20.54212188720703, -19.820459365844727, -19.098796844482422, -18.377134323120117, -17.655471801757812, -16.933807373046875, -16.21214485168457, -15.490482330322266, -14.768819808959961, -14.047157287597656, -13.325494766235352, -12.60383129119873, -11.882168769836426, -11.160506248474121, -10.4388427734375, -9.717180252075195, -8.99551773071289, -8.273855209350586, -7.552192211151123, -6.83052921295166, -6.1088666915893555, -5.387204170227051, -4.665541172027588, -3.943878173828125, -3.222217559814453, -2.5005548000335693, -1.7788920402526855, -1.0572292804718018, -0.33556652069091797, 0.3860962390899658, 1.1077589988708496, 1.8294219970703125, 2.551084518432617, 3.272747278213501, 3.9944100379943848, 4.716073036193848, 5.437735557556152, 6.159398078918457, 6.88106107711792, 7.602724075317383, 8.324386596679688, 9.046049118041992, 9.767711639404297, 10.489375114440918, 11.211037635803223, 11.932700157165527, 12.654363632202148, 13.376026153564453, 14.097688674926758, 14.819351196289062, 15.541013717651367, 16.262676239013672, 16.98434066772461, 17.706003189086914, 18.42766571044922, 19.149328231811523, 19.870990753173828]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 6.0, 15.0, 19.0, 19.0, 38.0, 36.0, 60.0, 96.0, 168.0, 232.0, 444.0, 768.0, 1721.0, 4162.0, 13266.0, 56788.0, 736408.0, 3088648.0, 246390.0, 31173.0, 8168.0, 2877.0, 1221.0, 619.0, 324.0, 197.0, 122.0, 80.0, 63.0, 57.0, 15.0, 18.0, 15.0, 10.0, 8.0, 3.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.830474853515625, -2.73712158203125, -2.643768310546875, -2.5504150390625, -2.457061767578125, -2.36370849609375, -2.270355224609375, -2.177001953125, -2.083648681640625, -1.99029541015625, -1.896942138671875, -1.8035888671875, -1.710235595703125, -1.61688232421875, -1.523529052734375, -1.43017578125, -1.336822509765625, -1.24346923828125, -1.150115966796875, -1.0567626953125, -0.963409423828125, -0.87005615234375, -0.776702880859375, -0.683349609375, -0.589996337890625, -0.49664306640625, -0.403289794921875, -0.3099365234375, -0.216583251953125, -0.12322998046875, -0.029876708984375, 0.0634765625, 0.156829833984375, 0.25018310546875, 0.343536376953125, 0.4368896484375, 0.530242919921875, 0.62359619140625, 0.716949462890625, 0.810302734375, 0.903656005859375, 0.99700927734375, 1.090362548828125, 1.1837158203125, 1.277069091796875, 1.37042236328125, 1.463775634765625, 1.55712890625, 1.650482177734375, 1.74383544921875, 1.837188720703125, 1.9305419921875, 2.023895263671875, 2.11724853515625, 2.210601806640625, 2.303955078125, 2.397308349609375, 2.49066162109375, 2.584014892578125, 2.6773681640625, 2.770721435546875, 2.86407470703125, 2.957427978515625, 3.05078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 12.0, 7.0, 21.0, 11.0, 27.0, 31.0, 30.0, 26.0, 43.0, 57.0, 44.0, 55.0, 74.0, 63.0, 53.0, 65.0, 59.0, 44.0, 60.0, 38.0, 37.0, 37.0, 29.0, 19.0, 11.0, 9.0, 9.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.395233154296875, -1.34124755859375, -1.287261962890625, -1.2332763671875, -1.179290771484375, -1.12530517578125, -1.071319580078125, -1.017333984375, -0.963348388671875, -0.90936279296875, -0.855377197265625, -0.8013916015625, -0.747406005859375, -0.69342041015625, -0.639434814453125, -0.58544921875, -0.531463623046875, -0.47747802734375, -0.423492431640625, -0.3695068359375, -0.315521240234375, -0.26153564453125, -0.207550048828125, -0.153564453125, -0.099578857421875, -0.04559326171875, 0.008392333984375, 0.0623779296875, 0.116363525390625, 0.17034912109375, 0.224334716796875, 0.2783203125, 0.332305908203125, 0.38629150390625, 0.440277099609375, 0.4942626953125, 0.548248291015625, 0.60223388671875, 0.656219482421875, 0.710205078125, 0.764190673828125, 0.81817626953125, 0.872161865234375, 0.9261474609375, 0.980133056640625, 1.03411865234375, 1.088104248046875, 1.14208984375, 1.196075439453125, 1.25006103515625, 1.304046630859375, 1.3580322265625, 1.412017822265625, 1.46600341796875, 1.519989013671875, 1.573974609375, 1.627960205078125, 1.68194580078125, 1.735931396484375, 1.7899169921875, 1.843902587890625, 1.89788818359375, 1.951873779296875, 2.005859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 4.0, 18.0, 17.0, 27.0, 38.0, 66.0, 98.0, 167.0, 326.0, 720.0, 1713.0, 4832.0, 17188.0, 102098.0, 3228524.0, 777423.0, 45540.0, 10066.0, 3120.0, 1181.0, 544.0, 240.0, 135.0, 61.0, 41.0, 33.0, 16.0, 11.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.3671875, -4.21014404296875, -4.0531005859375, -3.89605712890625, -3.739013671875, -3.58197021484375, -3.4249267578125, -3.26788330078125, -3.11083984375, -2.95379638671875, -2.7967529296875, -2.63970947265625, -2.482666015625, -2.32562255859375, -2.1685791015625, -2.01153564453125, -1.8544921875, -1.69744873046875, -1.5404052734375, -1.38336181640625, -1.226318359375, -1.06927490234375, -0.9122314453125, -0.75518798828125, -0.59814453125, -0.44110107421875, -0.2840576171875, -0.12701416015625, 0.030029296875, 0.18707275390625, 0.3441162109375, 0.50115966796875, 0.658203125, 0.81524658203125, 0.9722900390625, 1.12933349609375, 1.286376953125, 1.44342041015625, 1.6004638671875, 1.75750732421875, 1.91455078125, 2.07159423828125, 2.2286376953125, 2.38568115234375, 2.542724609375, 2.69976806640625, 2.8568115234375, 3.01385498046875, 3.1708984375, 3.32794189453125, 3.4849853515625, 3.64202880859375, 3.799072265625, 3.95611572265625, 4.1131591796875, 4.27020263671875, 4.42724609375, 4.58428955078125, 4.7413330078125, 4.89837646484375, 5.055419921875, 5.21246337890625, 5.3695068359375, 5.52655029296875, 5.68359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 5.0, 9.0, 20.0, 17.0, 30.0, 30.0, 38.0, 78.0, 134.0, 279.0, 475.0, 915.0, 889.0, 525.0, 234.0, 146.0, 79.0, 55.0, 22.0, 21.0, 19.0, 9.0, 5.0, 9.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.140625, -4.99407958984375, -4.8475341796875, -4.70098876953125, -4.554443359375, -4.40789794921875, -4.2613525390625, -4.11480712890625, -3.96826171875, -3.82171630859375, -3.6751708984375, -3.52862548828125, -3.382080078125, -3.23553466796875, -3.0889892578125, -2.94244384765625, -2.7958984375, -2.64935302734375, -2.5028076171875, -2.35626220703125, -2.209716796875, -2.06317138671875, -1.9166259765625, -1.77008056640625, -1.62353515625, -1.47698974609375, -1.3304443359375, -1.18389892578125, -1.037353515625, -0.89080810546875, -0.7442626953125, -0.59771728515625, -0.451171875, -0.30462646484375, -0.1580810546875, -0.01153564453125, 0.135009765625, 0.28155517578125, 0.4281005859375, 0.57464599609375, 0.72119140625, 0.86773681640625, 1.0142822265625, 1.16082763671875, 1.307373046875, 1.45391845703125, 1.6004638671875, 1.74700927734375, 1.8935546875, 2.04010009765625, 2.1866455078125, 2.33319091796875, 2.479736328125, 2.62628173828125, 2.7728271484375, 2.91937255859375, 3.06591796875, 3.21246337890625, 3.3590087890625, 3.50555419921875, 3.652099609375, 3.79864501953125, 3.9451904296875, 4.09173583984375, 4.23828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 18.0, 41.0, 121.0, 281.0, 296.0, 157.0, 45.0, 14.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.36859893798828, -62.23651885986328, -60.10443878173828, -57.97235870361328, -55.84027862548828, -53.70819854736328, -51.57612228393555, -49.44404220581055, -47.31196212768555, -45.17988204956055, -43.04780197143555, -40.91572189331055, -38.78364562988281, -36.65156555175781, -34.51948547363281, -32.38740539550781, -30.255325317382812, -28.123245239257812, -25.991165161132812, -23.859086990356445, -21.727006912231445, -19.594926834106445, -17.462848663330078, -15.330768585205078, -13.198688507080078, -11.066608428955078, -8.934529304504395, -6.802449703216553, -4.670370101928711, -2.538290023803711, -0.40621089935302734, 1.7258682250976562, 3.8579559326171875, 5.990035533905029, 8.122115135192871, 10.254194259643555, 12.386274337768555, 14.518354415893555, 16.650432586669922, 18.782512664794922, 20.914592742919922, 23.046672821044922, 25.178752899169922, 27.31083106994629, 29.44291114807129, 31.57499122619629, 33.707069396972656, 35.839149475097656, 37.971229553222656, 40.103309631347656, 42.235389709472656, 44.367469787597656, 46.499549865722656, 48.631629943847656, 50.76370620727539, 52.89578628540039, 55.02786636352539, 57.15994644165039, 59.29202651977539, 61.42410659790039, 63.556182861328125, 65.68826293945312, 67.82034301757812, 69.95242309570312, 72.08450317382812]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 4.0, 2.0, 8.0, 13.0, 15.0, 16.0, 19.0, 21.0, 26.0, 23.0, 26.0, 37.0, 39.0, 36.0, 41.0, 41.0, 38.0, 45.0, 32.0, 37.0, 52.0, 41.0, 47.0, 43.0, 31.0, 35.0, 33.0, 24.0, 28.0, 21.0, 22.0, 20.0, 12.0, 13.0, 14.0, 9.0, 7.0, 6.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.232139587402344, -13.773418426513672, -13.314697265625, -12.855976104736328, -12.397254943847656, -11.938533782958984, -11.479812622070312, -11.02109146118164, -10.562370300292969, -10.103649139404297, -9.644927978515625, -9.186206817626953, -8.727485656738281, -8.26876449584961, -7.8100433349609375, -7.351322174072266, -6.892601490020752, -6.43388032913208, -5.975159168243408, -5.516438007354736, -5.0577168464660645, -4.598996162414551, -4.140275001525879, -3.681553602218628, -3.222832441329956, -2.764111280441284, -2.3053901195526123, -1.84666907787323, -1.387947916984558, -0.9292268753051758, -0.4705057144165039, -0.011784553527832031, 0.44693660736083984, 0.9056577682495117, 1.3643789291381836, 1.823099970817566, 2.2818212509155273, 2.74054217338562, 3.199263334274292, 3.657984495162964, 4.116705894470215, 4.575427055358887, 5.034148216247559, 5.4928693771362305, 5.951590538024902, 6.410311698913574, 6.869032859802246, 7.327754020690918, 7.786474704742432, 8.245195388793945, 8.703916549682617, 9.162637710571289, 9.621358871459961, 10.080080032348633, 10.538801193237305, 10.997522354125977, 11.456243515014648, 11.91496467590332, 12.373685836791992, 12.832406997680664, 13.291128158569336, 13.749849319458008, 14.20857048034668, 14.667291641235352, 15.126012802124023]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 6.0, 8.0, 11.0, 28.0, 37.0, 62.0, 81.0, 155.0, 277.0, 482.0, 847.0, 1610.0, 3162.0, 7017.0, 16483.0, 44684.0, 132434.0, 325286.0, 317753.0, 126026.0, 42774.0, 16022.0, 6829.0, 3002.0, 1560.0, 840.0, 429.0, 278.0, 160.0, 79.0, 52.0, 22.0, 26.0, 9.0, 14.0, 4.0, 2.0, 2.0, 3.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.44158935546875, -2.3675537109375, -2.29351806640625, -2.219482421875, -2.14544677734375, -2.0714111328125, -1.99737548828125, -1.92333984375, -1.84930419921875, -1.7752685546875, -1.70123291015625, -1.627197265625, -1.55316162109375, -1.4791259765625, -1.40509033203125, -1.3310546875, -1.25701904296875, -1.1829833984375, -1.10894775390625, -1.034912109375, -0.96087646484375, -0.8868408203125, -0.81280517578125, -0.73876953125, -0.66473388671875, -0.5906982421875, -0.51666259765625, -0.442626953125, -0.36859130859375, -0.2945556640625, -0.22052001953125, -0.146484375, -0.07244873046875, 0.0015869140625, 0.07562255859375, 0.149658203125, 0.22369384765625, 0.2977294921875, 0.37176513671875, 0.44580078125, 0.51983642578125, 0.5938720703125, 0.66790771484375, 0.741943359375, 0.81597900390625, 0.8900146484375, 0.96405029296875, 1.0380859375, 1.11212158203125, 1.1861572265625, 1.26019287109375, 1.334228515625, 1.40826416015625, 1.4822998046875, 1.55633544921875, 1.63037109375, 1.70440673828125, 1.7784423828125, 1.85247802734375, 1.926513671875, 2.00054931640625, 2.0745849609375, 2.14862060546875, 2.22265625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 9.0, 11.0, 10.0, 16.0, 19.0, 30.0, 39.0, 29.0, 36.0, 40.0, 47.0, 62.0, 61.0, 68.0, 71.0, 70.0, 67.0, 53.0, 47.0, 32.0, 51.0, 24.0, 15.0, 22.0, 20.0, 11.0, 9.0, 10.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6064453125, -1.5473785400390625, -1.488311767578125, -1.4292449951171875, -1.37017822265625, -1.3111114501953125, -1.252044677734375, -1.1929779052734375, -1.1339111328125, -1.0748443603515625, -1.015777587890625, -0.9567108154296875, -0.89764404296875, -0.8385772705078125, -0.779510498046875, -0.7204437255859375, -0.661376953125, -0.6023101806640625, -0.543243408203125, -0.4841766357421875, -0.42510986328125, -0.3660430908203125, -0.306976318359375, -0.2479095458984375, -0.1888427734375, -0.1297760009765625, -0.070709228515625, -0.0116424560546875, 0.04742431640625, 0.1064910888671875, 0.165557861328125, 0.2246246337890625, 0.28369140625, 0.3427581787109375, 0.401824951171875, 0.4608917236328125, 0.51995849609375, 0.5790252685546875, 0.638092041015625, 0.6971588134765625, 0.7562255859375, 0.8152923583984375, 0.874359130859375, 0.9334259033203125, 0.99249267578125, 1.0515594482421875, 1.110626220703125, 1.1696929931640625, 1.228759765625, 1.2878265380859375, 1.346893310546875, 1.4059600830078125, 1.46502685546875, 1.5240936279296875, 1.583160400390625, 1.6422271728515625, 1.7012939453125, 1.7603607177734375, 1.819427490234375, 1.8784942626953125, 1.93756103515625, 1.9966278076171875, 2.055694580078125, 2.1147613525390625, 2.173828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 5.0, 7.0, 4.0, 8.0, 15.0, 17.0, 24.0, 41.0, 35.0, 65.0, 91.0, 123.0, 245.0, 464.0, 939.0, 2259.0, 6461.0, 25389.0, 149307.0, 666360.0, 159033.0, 26420.0, 6738.0, 2384.0, 935.0, 484.0, 245.0, 145.0, 93.0, 55.0, 40.0, 27.0, 23.0, 12.0, 14.0, 8.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-4.44921875, -4.31646728515625, -4.1837158203125, -4.05096435546875, -3.918212890625, -3.78546142578125, -3.6527099609375, -3.51995849609375, -3.38720703125, -3.25445556640625, -3.1217041015625, -2.98895263671875, -2.856201171875, -2.72344970703125, -2.5906982421875, -2.45794677734375, -2.3251953125, -2.19244384765625, -2.0596923828125, -1.92694091796875, -1.794189453125, -1.66143798828125, -1.5286865234375, -1.39593505859375, -1.26318359375, -1.13043212890625, -0.9976806640625, -0.86492919921875, -0.732177734375, -0.59942626953125, -0.4666748046875, -0.33392333984375, -0.201171875, -0.06842041015625, 0.0643310546875, 0.19708251953125, 0.329833984375, 0.46258544921875, 0.5953369140625, 0.72808837890625, 0.86083984375, 0.99359130859375, 1.1263427734375, 1.25909423828125, 1.391845703125, 1.52459716796875, 1.6573486328125, 1.79010009765625, 1.9228515625, 2.05560302734375, 2.1883544921875, 2.32110595703125, 2.453857421875, 2.58660888671875, 2.7193603515625, 2.85211181640625, 2.98486328125, 3.11761474609375, 3.2503662109375, 3.38311767578125, 3.515869140625, 3.64862060546875, 3.7813720703125, 3.91412353515625, 4.046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 6.0, 10.0, 16.0, 11.0, 11.0, 23.0, 25.0, 40.0, 43.0, 46.0, 35.0, 49.0, 54.0, 59.0, 34.0, 53.0, 46.0, 47.0, 47.0, 45.0, 38.0, 45.0, 33.0, 32.0, 21.0, 18.0, 15.0, 15.0, 9.0, 18.0, 6.0, 9.0, 9.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.12481689453125, -4.9449462890625, -4.76507568359375, -4.585205078125, -4.40533447265625, -4.2254638671875, -4.04559326171875, -3.86572265625, -3.68585205078125, -3.5059814453125, -3.32611083984375, -3.146240234375, -2.96636962890625, -2.7864990234375, -2.60662841796875, -2.4267578125, -2.24688720703125, -2.0670166015625, -1.88714599609375, -1.707275390625, -1.52740478515625, -1.3475341796875, -1.16766357421875, -0.98779296875, -0.80792236328125, -0.6280517578125, -0.44818115234375, -0.268310546875, -0.08843994140625, 0.0914306640625, 0.27130126953125, 0.451171875, 0.63104248046875, 0.8109130859375, 0.99078369140625, 1.170654296875, 1.35052490234375, 1.5303955078125, 1.71026611328125, 1.89013671875, 2.07000732421875, 2.2498779296875, 2.42974853515625, 2.609619140625, 2.78948974609375, 2.9693603515625, 3.14923095703125, 3.3291015625, 3.50897216796875, 3.6888427734375, 3.86871337890625, 4.048583984375, 4.22845458984375, 4.4083251953125, 4.58819580078125, 4.76806640625, 4.94793701171875, 5.1278076171875, 5.30767822265625, 5.487548828125, 5.66741943359375, 5.8472900390625, 6.02716064453125, 6.20703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 12.0, 11.0, 25.0, 39.0, 43.0, 74.0, 93.0, 152.0, 228.0, 344.0, 521.0, 955.0, 1614.0, 3000.0, 6375.0, 17497.0, 65236.0, 344082.0, 506201.0, 69536.0, 18518.0, 6686.0, 3085.0, 1648.0, 936.0, 561.0, 365.0, 255.0, 145.0, 94.0, 71.0, 57.0, 27.0, 22.0, 12.0, 7.0, 11.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.130859375, -1.0944061279296875, -1.057952880859375, -1.0214996337890625, -0.98504638671875, -0.9485931396484375, -0.912139892578125, -0.8756866455078125, -0.8392333984375, -0.8027801513671875, -0.766326904296875, -0.7298736572265625, -0.69342041015625, -0.6569671630859375, -0.620513916015625, -0.5840606689453125, -0.547607421875, -0.5111541748046875, -0.474700927734375, -0.4382476806640625, -0.40179443359375, -0.3653411865234375, -0.328887939453125, -0.2924346923828125, -0.2559814453125, -0.2195281982421875, -0.183074951171875, -0.1466217041015625, -0.11016845703125, -0.0737152099609375, -0.037261962890625, -0.0008087158203125, 0.03564453125, 0.0720977783203125, 0.108551025390625, 0.1450042724609375, 0.18145751953125, 0.2179107666015625, 0.254364013671875, 0.2908172607421875, 0.3272705078125, 0.3637237548828125, 0.400177001953125, 0.4366302490234375, 0.47308349609375, 0.5095367431640625, 0.545989990234375, 0.5824432373046875, 0.618896484375, 0.6553497314453125, 0.691802978515625, 0.7282562255859375, 0.76470947265625, 0.8011627197265625, 0.837615966796875, 0.8740692138671875, 0.9105224609375, 0.9469757080078125, 0.983428955078125, 1.0198822021484375, 1.05633544921875, 1.0927886962890625, 1.129241943359375, 1.1656951904296875, 1.2021484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 12.0, 23.0, 56.0, 128.0, 256.0, 224.0, 158.0, 59.0, 28.0, 15.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006465911865234375, -0.0006243810057640076, -0.0006021708250045776, -0.0005799606442451477, -0.0005577504634857178, -0.0005355402827262878, -0.0005133301019668579, -0.000491119921207428, -0.00046890974044799805, -0.0004466995596885681, -0.0004244893789291382, -0.00040227919816970825, -0.0003800690174102783, -0.0003578588366508484, -0.00033564865589141846, -0.0003134384751319885, -0.0002912282943725586, -0.00026901811361312866, -0.00024680793285369873, -0.0002245977520942688, -0.00020238757133483887, -0.00018017739057540894, -0.000157967209815979, -0.00013575702905654907, -0.00011354684829711914, -9.133666753768921e-05, -6.912648677825928e-05, -4.6916306018829346e-05, -2.4706125259399414e-05, -2.4959444999694824e-06, 1.971423625946045e-05, 4.192441701889038e-05, 6.413459777832031e-05, 8.634477853775024e-05, 0.00010855495929718018, 0.0001307651400566101, 0.00015297532081604004, 0.00017518550157546997, 0.0001973956823348999, 0.00021960586309432983, 0.00024181604385375977, 0.0002640262246131897, 0.00028623640537261963, 0.00030844658613204956, 0.0003306567668914795, 0.0003528669476509094, 0.00037507712841033936, 0.0003972873091697693, 0.0004194974899291992, 0.00044170767068862915, 0.0004639178514480591, 0.000486128032207489, 0.0005083382129669189, 0.0005305483937263489, 0.0005527585744857788, 0.0005749687552452087, 0.0005971789360046387, 0.0006193891167640686, 0.0006415992975234985, 0.0006638094782829285, 0.0006860196590423584, 0.0007082298398017883, 0.0007304400205612183, 0.0007526502013206482, 0.0007748603820800781]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 5.0, 2.0, 3.0, 8.0, 13.0, 10.0, 20.0, 37.0, 43.0, 82.0, 116.0, 199.0, 376.0, 679.0, 1332.0, 2950.0, 7163.0, 20885.0, 79165.0, 519086.0, 317865.0, 68002.0, 18632.0, 6477.0, 2692.0, 1247.0, 628.0, 307.0, 189.0, 100.0, 93.0, 45.0, 32.0, 28.0, 13.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1923828125, -1.155059814453125, -1.11773681640625, -1.080413818359375, -1.0430908203125, -1.005767822265625, -0.96844482421875, -0.931121826171875, -0.893798828125, -0.856475830078125, -0.81915283203125, -0.781829833984375, -0.7445068359375, -0.707183837890625, -0.66986083984375, -0.632537841796875, -0.59521484375, -0.557891845703125, -0.52056884765625, -0.483245849609375, -0.4459228515625, -0.408599853515625, -0.37127685546875, -0.333953857421875, -0.296630859375, -0.259307861328125, -0.22198486328125, -0.184661865234375, -0.1473388671875, -0.110015869140625, -0.07269287109375, -0.035369873046875, 0.001953125, 0.039276123046875, 0.07659912109375, 0.113922119140625, 0.1512451171875, 0.188568115234375, 0.22589111328125, 0.263214111328125, 0.300537109375, 0.337860107421875, 0.37518310546875, 0.412506103515625, 0.4498291015625, 0.487152099609375, 0.52447509765625, 0.561798095703125, 0.59912109375, 0.636444091796875, 0.67376708984375, 0.711090087890625, 0.7484130859375, 0.785736083984375, 0.82305908203125, 0.860382080078125, 0.897705078125, 0.935028076171875, 0.97235107421875, 1.009674072265625, 1.0469970703125, 1.084320068359375, 1.12164306640625, 1.158966064453125, 1.1962890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 0.0, 1.0, 6.0, 7.0, 7.0, 8.0, 12.0, 19.0, 22.0, 29.0, 39.0, 66.0, 61.0, 98.0, 104.0, 88.0, 92.0, 75.0, 66.0, 48.0, 38.0, 26.0, 16.0, 14.0, 12.0, 8.0, 6.0, 2.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.638671875, -1.5968780517578125, -1.555084228515625, -1.5132904052734375, -1.47149658203125, -1.4297027587890625, -1.387908935546875, -1.3461151123046875, -1.3043212890625, -1.2625274658203125, -1.220733642578125, -1.1789398193359375, -1.13714599609375, -1.0953521728515625, -1.053558349609375, -1.0117645263671875, -0.969970703125, -0.9281768798828125, -0.886383056640625, -0.8445892333984375, -0.80279541015625, -0.7610015869140625, -0.719207763671875, -0.6774139404296875, -0.6356201171875, -0.5938262939453125, -0.552032470703125, -0.5102386474609375, -0.46844482421875, -0.4266510009765625, -0.384857177734375, -0.3430633544921875, -0.30126953125, -0.2594757080078125, -0.217681884765625, -0.1758880615234375, -0.13409423828125, -0.0923004150390625, -0.050506591796875, -0.0087127685546875, 0.0330810546875, 0.0748748779296875, 0.116668701171875, 0.1584625244140625, 0.20025634765625, 0.2420501708984375, 0.283843994140625, 0.3256378173828125, 0.367431640625, 0.4092254638671875, 0.451019287109375, 0.4928131103515625, 0.53460693359375, 0.5764007568359375, 0.618194580078125, 0.6599884033203125, 0.7017822265625, 0.7435760498046875, 0.785369873046875, 0.8271636962890625, 0.86895751953125, 0.9107513427734375, 0.952545166015625, 0.9943389892578125, 1.0361328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 20.0, 28.0, 91.0, 196.0, 344.0, 187.0, 77.0, 27.0, 13.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.93738555908203, -60.37105941772461, -58.80473327636719, -57.23841094970703, -55.67208480834961, -54.10575866699219, -52.539432525634766, -50.973106384277344, -49.40678024291992, -47.8404541015625, -46.27412796020508, -44.707801818847656, -43.1414794921875, -41.57515335083008, -40.008827209472656, -38.442501068115234, -36.87617492675781, -35.30984878540039, -33.74352264404297, -32.17720031738281, -30.610872268676758, -29.04454803466797, -27.478221893310547, -25.911895751953125, -24.34557342529297, -22.779247283935547, -21.212923049926758, -19.646596908569336, -18.080270767211914, -16.513946533203125, -14.947620391845703, -13.381294250488281, -11.81496810913086, -10.248642921447754, -8.682316780090332, -7.115991592407227, -5.549665927886963, -3.983340263366699, -2.4170150756835938, -0.8506889343261719, 0.7156362533569336, 2.2819619178771973, 3.848287343978882, 5.414612770080566, 6.98093843460083, 8.547264099121094, 10.1135892868042, 11.679915428161621, 13.246240615844727, 14.812565803527832, 16.378890991210938, 17.94521713256836, 19.51154327392578, 21.077869415283203, 22.644193649291992, 24.210519790649414, 25.776844024658203, 27.343170166015625, 28.909494400024414, 30.475820541381836, 32.042144775390625, 33.60847091674805, 35.17479705810547, 36.74112319946289, 38.30744934082031]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 7.0, 8.0, 10.0, 11.0, 12.0, 18.0, 25.0, 26.0, 37.0, 45.0, 36.0, 49.0, 53.0, 80.0, 97.0, 88.0, 85.0, 52.0, 39.0, 36.0, 33.0, 22.0, 31.0, 20.0, 20.0, 15.0, 13.0, 8.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.187742233276367, -18.34599494934082, -17.504247665405273, -16.662500381469727, -15.82075309753418, -14.979005813598633, -14.137258529663086, -13.295511245727539, -12.453763961791992, -11.612016677856445, -10.770269393920898, -9.928522109985352, -9.086774826049805, -8.245027542114258, -7.403280258178711, -6.561532974243164, -5.719785690307617, -4.87803840637207, -4.036291122436523, -3.1945438385009766, -2.3527965545654297, -1.5110492706298828, -0.6693019866943359, 0.17244529724121094, 1.0141925811767578, 1.8559398651123047, 2.6976871490478516, 3.5394344329833984, 4.381181716918945, 5.222929000854492, 6.064676284790039, 6.906423568725586, 7.7481689453125, 8.589916229248047, 9.431663513183594, 10.27341079711914, 11.115158081054688, 11.956905364990234, 12.798652648925781, 13.640399932861328, 14.482147216796875, 15.323894500732422, 16.16564178466797, 17.007389068603516, 17.849136352539062, 18.69088363647461, 19.532630920410156, 20.374378204345703, 21.21612548828125, 22.057872772216797, 22.899620056152344, 23.74136734008789, 24.583114624023438, 25.424861907958984, 26.26660919189453, 27.108356475830078, 27.950103759765625, 28.791851043701172, 29.63359832763672, 30.475345611572266, 31.317092895507812, 32.15884017944336, 33.000587463378906, 33.84233474731445, 34.68408203125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 8.0, 6.0, 12.0, 19.0, 18.0, 42.0, 44.0, 83.0, 101.0, 169.0, 218.0, 315.0, 504.0, 899.0, 1464.0, 2359.0, 4649.0, 9910.0, 24718.0, 77978.0, 319244.0, 1351320.0, 1766108.0, 472550.0, 107408.0, 30761.0, 11419.0, 5220.0, 2620.0, 1461.0, 886.0, 584.0, 369.0, 242.0, 168.0, 118.0, 87.0, 46.0, 59.0, 22.0, 27.0, 16.0, 13.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.4267578125, -1.38494873046875, -1.3431396484375, -1.30133056640625, -1.259521484375, -1.21771240234375, -1.1759033203125, -1.13409423828125, -1.09228515625, -1.05047607421875, -1.0086669921875, -0.96685791015625, -0.925048828125, -0.88323974609375, -0.8414306640625, -0.79962158203125, -0.7578125, -0.71600341796875, -0.6741943359375, -0.63238525390625, -0.590576171875, -0.54876708984375, -0.5069580078125, -0.46514892578125, -0.42333984375, -0.38153076171875, -0.3397216796875, -0.29791259765625, -0.256103515625, -0.21429443359375, -0.1724853515625, -0.13067626953125, -0.0888671875, -0.04705810546875, -0.0052490234375, 0.03656005859375, 0.078369140625, 0.12017822265625, 0.1619873046875, 0.20379638671875, 0.24560546875, 0.28741455078125, 0.3292236328125, 0.37103271484375, 0.412841796875, 0.45465087890625, 0.4964599609375, 0.53826904296875, 0.580078125, 0.62188720703125, 0.6636962890625, 0.70550537109375, 0.747314453125, 0.78912353515625, 0.8309326171875, 0.87274169921875, 0.91455078125, 0.95635986328125, 0.9981689453125, 1.03997802734375, 1.081787109375, 1.12359619140625, 1.1654052734375, 1.20721435546875, 1.2490234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 10.0, 8.0, 5.0, 14.0, 21.0, 29.0, 22.0, 29.0, 33.0, 50.0, 43.0, 38.0, 53.0, 52.0, 49.0, 69.0, 61.0, 54.0, 40.0, 37.0, 43.0, 31.0, 32.0, 44.0, 21.0, 24.0, 13.0, 22.0, 12.0, 3.0, 6.0, 9.0, 6.0, 0.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2666015625, -1.2168731689453125, -1.167144775390625, -1.1174163818359375, -1.06768798828125, -1.0179595947265625, -0.968231201171875, -0.9185028076171875, -0.8687744140625, -0.8190460205078125, -0.769317626953125, -0.7195892333984375, -0.66986083984375, -0.6201324462890625, -0.570404052734375, -0.5206756591796875, -0.470947265625, -0.4212188720703125, -0.371490478515625, -0.3217620849609375, -0.27203369140625, -0.2223052978515625, -0.172576904296875, -0.1228485107421875, -0.0731201171875, -0.0233917236328125, 0.026336669921875, 0.0760650634765625, 0.12579345703125, 0.1755218505859375, 0.225250244140625, 0.2749786376953125, 0.32470703125, 0.3744354248046875, 0.424163818359375, 0.4738922119140625, 0.52362060546875, 0.5733489990234375, 0.623077392578125, 0.6728057861328125, 0.7225341796875, 0.7722625732421875, 0.821990966796875, 0.8717193603515625, 0.92144775390625, 0.9711761474609375, 1.020904541015625, 1.0706329345703125, 1.120361328125, 1.1700897216796875, 1.219818115234375, 1.2695465087890625, 1.31927490234375, 1.3690032958984375, 1.418731689453125, 1.4684600830078125, 1.5181884765625, 1.5679168701171875, 1.617645263671875, 1.6673736572265625, 1.71710205078125, 1.7668304443359375, 1.816558837890625, 1.8662872314453125, 1.916015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 7.0, 18.0, 48.0, 69.0, 144.0, 400.0, 1566.0, 10428.0, 630114.0, 3524817.0, 23333.0, 2340.0, 568.0, 226.0, 87.0, 47.0, 16.0, 13.0, 7.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28515625, -6.04473876953125, -5.8043212890625, -5.56390380859375, -5.323486328125, -5.08306884765625, -4.8426513671875, -4.60223388671875, -4.36181640625, -4.12139892578125, -3.8809814453125, -3.64056396484375, -3.400146484375, -3.15972900390625, -2.9193115234375, -2.67889404296875, -2.4384765625, -2.19805908203125, -1.9576416015625, -1.71722412109375, -1.476806640625, -1.23638916015625, -0.9959716796875, -0.75555419921875, -0.51513671875, -0.27471923828125, -0.0343017578125, 0.20611572265625, 0.446533203125, 0.68695068359375, 0.9273681640625, 1.16778564453125, 1.408203125, 1.64862060546875, 1.8890380859375, 2.12945556640625, 2.369873046875, 2.61029052734375, 2.8507080078125, 3.09112548828125, 3.33154296875, 3.57196044921875, 3.8123779296875, 4.05279541015625, 4.293212890625, 4.53363037109375, 4.7740478515625, 5.01446533203125, 5.2548828125, 5.49530029296875, 5.7357177734375, 5.97613525390625, 6.216552734375, 6.45697021484375, 6.6973876953125, 6.93780517578125, 7.17822265625, 7.41864013671875, 7.6590576171875, 7.89947509765625, 8.139892578125, 8.38031005859375, 8.6207275390625, 8.86114501953125, 9.1015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 11.0, 15.0, 38.0, 63.0, 84.0, 175.0, 357.0, 826.0, 1047.0, 724.0, 356.0, 152.0, 82.0, 32.0, 35.0, 23.0, 14.0, 10.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.2237548828125, -5.076416015625, -4.9290771484375, -4.78173828125, -4.6343994140625, -4.487060546875, -4.3397216796875, -4.1923828125, -4.0450439453125, -3.897705078125, -3.7503662109375, -3.60302734375, -3.4556884765625, -3.308349609375, -3.1610107421875, -3.013671875, -2.8663330078125, -2.718994140625, -2.5716552734375, -2.42431640625, -2.2769775390625, -2.129638671875, -1.9822998046875, -1.8349609375, -1.6876220703125, -1.540283203125, -1.3929443359375, -1.24560546875, -1.0982666015625, -0.950927734375, -0.8035888671875, -0.65625, -0.5089111328125, -0.361572265625, -0.2142333984375, -0.06689453125, 0.0804443359375, 0.227783203125, 0.3751220703125, 0.5224609375, 0.6697998046875, 0.817138671875, 0.9644775390625, 1.11181640625, 1.2591552734375, 1.406494140625, 1.5538330078125, 1.701171875, 1.8485107421875, 1.995849609375, 2.1431884765625, 2.29052734375, 2.4378662109375, 2.585205078125, 2.7325439453125, 2.8798828125, 3.0272216796875, 3.174560546875, 3.3218994140625, 3.46923828125, 3.6165771484375, 3.763916015625, 3.9112548828125, 4.05859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 1.0, 5.0, 11.0, 34.0, 48.0, 117.0, 165.0, 220.0, 179.0, 100.0, 64.0, 31.0, 18.0, 1.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.15801239013672, -34.08146286010742, -33.00490951538086, -31.928359985351562, -30.851810455322266, -29.775259017944336, -28.698707580566406, -27.62215805053711, -26.54560661315918, -25.46905517578125, -24.392505645751953, -23.315954208374023, -22.239402770996094, -21.162853240966797, -20.086301803588867, -19.009750366210938, -17.93320083618164, -16.85664939880371, -15.780099868774414, -14.703548431396484, -13.626997947692871, -12.550447463989258, -11.473896026611328, -10.397345542907715, -9.320795059204102, -8.244244575500488, -7.167693614959717, -6.091142654418945, -5.014592170715332, -3.9380416870117188, -2.8614907264709473, -1.7849397659301758, -0.7083930969238281, 0.36815762519836426, 1.4447083473205566, 2.521259069442749, 3.5978097915649414, 4.674360275268555, 5.750911235809326, 6.827462196350098, 7.904012680053711, 8.980563163757324, 10.057113647460938, 11.133665084838867, 12.21021556854248, 13.286766052246094, 14.363317489624023, 15.439867973327637, 16.51641845703125, 17.59296989440918, 18.669519424438477, 19.746070861816406, 20.822620391845703, 21.899171829223633, 22.975723266601562, 24.05227279663086, 25.12882423400879, 26.20537567138672, 27.281925201416016, 28.358476638793945, 29.435028076171875, 30.511577606201172, 31.5881290435791, 32.66468048095703, 33.74123001098633]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 13.0, 12.0, 12.0, 12.0, 13.0, 17.0, 21.0, 25.0, 19.0, 30.0, 43.0, 47.0, 34.0, 42.0, 63.0, 55.0, 45.0, 64.0, 56.0, 50.0, 51.0, 31.0, 32.0, 36.0, 23.0, 21.0, 22.0, 16.0, 16.0, 20.0, 6.0, 12.0, 4.0, 6.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.210481643676758, -13.767874717712402, -13.325267791748047, -12.882659912109375, -12.44005298614502, -11.997446060180664, -11.554838180541992, -11.112231254577637, -10.669624328613281, -10.227017402648926, -9.78441047668457, -9.341802597045898, -8.899195671081543, -8.456588745117188, -8.013980865478516, -7.57137393951416, -7.128767013549805, -6.686160087585449, -6.2435526847839355, -5.800945281982422, -5.358338356018066, -4.915731430053711, -4.473124027252197, -4.030516624450684, -3.587909698486328, -3.1453025341033936, -2.702695369720459, -2.2600882053375244, -1.8174810409545898, -1.3748738765716553, -0.9322667121887207, -0.48965954780578613, -0.04705238342285156, 0.395554780960083, 0.8381619453430176, 1.2807691097259521, 1.7233762741088867, 2.1659834384918213, 2.608590602874756, 3.0511977672576904, 3.493804931640625, 3.9364120960235596, 4.379019260406494, 4.821626663208008, 5.264233589172363, 5.706840515136719, 6.149447917938232, 6.592055320739746, 7.034662246704102, 7.477269172668457, 7.919876575469971, 8.362483978271484, 8.80509090423584, 9.247697830200195, 9.690305709838867, 10.132912635803223, 10.575519561767578, 11.018126487731934, 11.460733413696289, 11.903341293334961, 12.345948219299316, 12.788555145263672, 13.231163024902344, 13.6737699508667, 14.116376876831055]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 15.0, 25.0, 35.0, 48.0, 88.0, 148.0, 255.0, 419.0, 757.0, 1368.0, 2460.0, 4650.0, 9407.0, 20036.0, 45955.0, 114638.0, 271053.0, 317387.0, 151068.0, 59733.0, 25139.0, 11614.0, 5588.0, 3022.0, 1557.0, 873.0, 502.0, 290.0, 161.0, 100.0, 55.0, 35.0, 34.0, 14.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6552734375, -1.598480224609375, -1.54168701171875, -1.484893798828125, -1.4281005859375, -1.371307373046875, -1.31451416015625, -1.257720947265625, -1.200927734375, -1.144134521484375, -1.08734130859375, -1.030548095703125, -0.9737548828125, -0.916961669921875, -0.86016845703125, -0.803375244140625, -0.74658203125, -0.689788818359375, -0.63299560546875, -0.576202392578125, -0.5194091796875, -0.462615966796875, -0.40582275390625, -0.349029541015625, -0.292236328125, -0.235443115234375, -0.17864990234375, -0.121856689453125, -0.0650634765625, -0.008270263671875, 0.04852294921875, 0.105316162109375, 0.162109375, 0.218902587890625, 0.27569580078125, 0.332489013671875, 0.3892822265625, 0.446075439453125, 0.50286865234375, 0.559661865234375, 0.616455078125, 0.673248291015625, 0.73004150390625, 0.786834716796875, 0.8436279296875, 0.900421142578125, 0.95721435546875, 1.014007568359375, 1.07080078125, 1.127593994140625, 1.18438720703125, 1.241180419921875, 1.2979736328125, 1.354766845703125, 1.41156005859375, 1.468353271484375, 1.525146484375, 1.581939697265625, 1.63873291015625, 1.695526123046875, 1.7523193359375, 1.809112548828125, 1.86590576171875, 1.922698974609375, 1.9794921875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 3.0, 2.0, 12.0, 13.0, 15.0, 16.0, 18.0, 25.0, 31.0, 35.0, 31.0, 37.0, 46.0, 44.0, 56.0, 58.0, 52.0, 63.0, 60.0, 38.0, 46.0, 35.0, 40.0, 27.0, 36.0, 26.0, 26.0, 25.0, 23.0, 16.0, 16.0, 7.0, 6.0, 6.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.36785888671875, -1.3157958984375, -1.26373291015625, -1.211669921875, -1.15960693359375, -1.1075439453125, -1.05548095703125, -1.00341796875, -0.95135498046875, -0.8992919921875, -0.84722900390625, -0.795166015625, -0.74310302734375, -0.6910400390625, -0.63897705078125, -0.5869140625, -0.53485107421875, -0.4827880859375, -0.43072509765625, -0.378662109375, -0.32659912109375, -0.2745361328125, -0.22247314453125, -0.17041015625, -0.11834716796875, -0.0662841796875, -0.01422119140625, 0.037841796875, 0.08990478515625, 0.1419677734375, 0.19403076171875, 0.24609375, 0.29815673828125, 0.3502197265625, 0.40228271484375, 0.454345703125, 0.50640869140625, 0.5584716796875, 0.61053466796875, 0.66259765625, 0.71466064453125, 0.7667236328125, 0.81878662109375, 0.870849609375, 0.92291259765625, 0.9749755859375, 1.02703857421875, 1.0791015625, 1.13116455078125, 1.1832275390625, 1.23529052734375, 1.287353515625, 1.33941650390625, 1.3914794921875, 1.44354248046875, 1.49560546875, 1.54766845703125, 1.5997314453125, 1.65179443359375, 1.703857421875, 1.75592041015625, 1.8079833984375, 1.86004638671875, 1.912109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 3.0, 5.0, 14.0, 19.0, 28.0, 52.0, 81.0, 124.0, 196.0, 357.0, 778.0, 2328.0, 11402.0, 144018.0, 831095.0, 49557.0, 5737.0, 1481.0, 570.0, 253.0, 160.0, 89.0, 82.0, 42.0, 27.0, 24.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.1331787109375, -4.930419921875, -4.7276611328125, -4.52490234375, -4.3221435546875, -4.119384765625, -3.9166259765625, -3.7138671875, -3.5111083984375, -3.308349609375, -3.1055908203125, -2.90283203125, -2.7000732421875, -2.497314453125, -2.2945556640625, -2.091796875, -1.8890380859375, -1.686279296875, -1.4835205078125, -1.28076171875, -1.0780029296875, -0.875244140625, -0.6724853515625, -0.4697265625, -0.2669677734375, -0.064208984375, 0.1385498046875, 0.34130859375, 0.5440673828125, 0.746826171875, 0.9495849609375, 1.15234375, 1.3551025390625, 1.557861328125, 1.7606201171875, 1.96337890625, 2.1661376953125, 2.368896484375, 2.5716552734375, 2.7744140625, 2.9771728515625, 3.179931640625, 3.3826904296875, 3.58544921875, 3.7882080078125, 3.990966796875, 4.1937255859375, 4.396484375, 4.5992431640625, 4.802001953125, 5.0047607421875, 5.20751953125, 5.4102783203125, 5.613037109375, 5.8157958984375, 6.0185546875, 6.2213134765625, 6.424072265625, 6.6268310546875, 6.82958984375, 7.0323486328125, 7.235107421875, 7.4378662109375, 7.640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 9.0, 8.0, 15.0, 9.0, 25.0, 16.0, 36.0, 36.0, 37.0, 47.0, 42.0, 53.0, 69.0, 76.0, 82.0, 61.0, 72.0, 54.0, 59.0, 41.0, 41.0, 18.0, 19.0, 18.0, 14.0, 10.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.81640625, -6.57305908203125, -6.3297119140625, -6.08636474609375, -5.843017578125, -5.59967041015625, -5.3563232421875, -5.11297607421875, -4.86962890625, -4.62628173828125, -4.3829345703125, -4.13958740234375, -3.896240234375, -3.65289306640625, -3.4095458984375, -3.16619873046875, -2.9228515625, -2.67950439453125, -2.4361572265625, -2.19281005859375, -1.949462890625, -1.70611572265625, -1.4627685546875, -1.21942138671875, -0.97607421875, -0.73272705078125, -0.4893798828125, -0.24603271484375, -0.002685546875, 0.24066162109375, 0.4840087890625, 0.72735595703125, 0.970703125, 1.21405029296875, 1.4573974609375, 1.70074462890625, 1.944091796875, 2.18743896484375, 2.4307861328125, 2.67413330078125, 2.91748046875, 3.16082763671875, 3.4041748046875, 3.64752197265625, 3.890869140625, 4.13421630859375, 4.3775634765625, 4.62091064453125, 4.8642578125, 5.10760498046875, 5.3509521484375, 5.59429931640625, 5.837646484375, 6.08099365234375, 6.3243408203125, 6.56768798828125, 6.81103515625, 7.05438232421875, 7.2977294921875, 7.54107666015625, 7.784423828125, 8.02777099609375, 8.2711181640625, 8.51446533203125, 8.7578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 7.0, 10.0, 10.0, 16.0, 18.0, 32.0, 48.0, 55.0, 89.0, 114.0, 229.0, 365.0, 668.0, 1236.0, 2589.0, 6101.0, 17402.0, 64899.0, 649301.0, 241469.0, 42044.0, 12585.0, 4787.0, 2068.0, 955.0, 560.0, 316.0, 204.0, 113.0, 67.0, 59.0, 33.0, 30.0, 8.0, 15.0, 15.0, 9.0, 5.0, 8.0, 3.0, 0.0, 1.0, 2.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0947265625, -1.0614013671875, -1.028076171875, -0.9947509765625, -0.96142578125, -0.9281005859375, -0.894775390625, -0.8614501953125, -0.828125, -0.7947998046875, -0.761474609375, -0.7281494140625, -0.69482421875, -0.6614990234375, -0.628173828125, -0.5948486328125, -0.5615234375, -0.5281982421875, -0.494873046875, -0.4615478515625, -0.42822265625, -0.3948974609375, -0.361572265625, -0.3282470703125, -0.294921875, -0.2615966796875, -0.228271484375, -0.1949462890625, -0.16162109375, -0.1282958984375, -0.094970703125, -0.0616455078125, -0.0283203125, 0.0050048828125, 0.038330078125, 0.0716552734375, 0.10498046875, 0.1383056640625, 0.171630859375, 0.2049560546875, 0.23828125, 0.2716064453125, 0.304931640625, 0.3382568359375, 0.37158203125, 0.4049072265625, 0.438232421875, 0.4715576171875, 0.5048828125, 0.5382080078125, 0.571533203125, 0.6048583984375, 0.63818359375, 0.6715087890625, 0.704833984375, 0.7381591796875, 0.771484375, 0.8048095703125, 0.838134765625, 0.8714599609375, 0.90478515625, 0.9381103515625, 0.971435546875, 1.0047607421875, 1.0380859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 3.0, 9.0, 6.0, 7.0, 11.0, 19.0, 18.0, 32.0, 52.0, 83.0, 163.0, 179.0, 153.0, 81.0, 55.0, 32.0, 28.0, 21.0, 11.0, 5.0, 9.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003819465637207031, -0.0003694407641887665, -0.00035693496465682983, -0.0003444291651248932, -0.00033192336559295654, -0.0003194175660610199, -0.00030691176652908325, -0.0002944059669971466, -0.00028190016746520996, -0.0002693943679332733, -0.00025688856840133667, -0.0002443827688694, -0.00023187696933746338, -0.00021937116980552673, -0.0002068653702735901, -0.00019435957074165344, -0.0001818537712097168, -0.00016934797167778015, -0.0001568421721458435, -0.00014433637261390686, -0.00013183057308197021, -0.00011932477355003357, -0.00010681897401809692, -9.431317448616028e-05, -8.180737495422363e-05, -6.930157542228699e-05, -5.679577589035034e-05, -4.4289976358413696e-05, -3.178417682647705e-05, -1.9278377294540405e-05, -6.77257776260376e-06, 5.733221769332886e-06, 1.823902130126953e-05, 3.074482083320618e-05, 4.325062036514282e-05, 5.575641989707947e-05, 6.826221942901611e-05, 8.076801896095276e-05, 9.32738184928894e-05, 0.00010577961802482605, 0.0001182854175567627, 0.00013079121708869934, 0.00014329701662063599, 0.00015580281615257263, 0.00016830861568450928, 0.00018081441521644592, 0.00019332021474838257, 0.00020582601428031921, 0.00021833181381225586, 0.0002308376133441925, 0.00024334341287612915, 0.0002558492124080658, 0.00026835501194000244, 0.0002808608114719391, 0.00029336661100387573, 0.0003058724105358124, 0.000318378210067749, 0.00033088400959968567, 0.0003433898091316223, 0.00035589560866355896, 0.0003684014081954956, 0.00038090720772743225, 0.0003934130072593689, 0.00040591880679130554, 0.0004184246063232422]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 3.0, 9.0, 9.0, 17.0, 18.0, 17.0, 22.0, 38.0, 48.0, 73.0, 99.0, 152.0, 286.0, 439.0, 687.0, 1379.0, 2646.0, 5924.0, 15234.0, 44145.0, 173070.0, 639764.0, 111210.0, 31990.0, 11600.0, 4651.0, 2276.0, 1046.0, 576.0, 380.0, 240.0, 151.0, 94.0, 71.0, 50.0, 37.0, 25.0, 18.0, 9.0, 15.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.8642578125, -0.8375473022460938, -0.8108367919921875, -0.7841262817382812, -0.757415771484375, -0.7307052612304688, -0.7039947509765625, -0.6772842407226562, -0.65057373046875, -0.6238632202148438, -0.5971527099609375, -0.5704421997070312, -0.543731689453125, -0.5170211791992188, -0.4903106689453125, -0.46360015869140625, -0.4368896484375, -0.41017913818359375, -0.3834686279296875, -0.35675811767578125, -0.330047607421875, -0.30333709716796875, -0.2766265869140625, -0.24991607666015625, -0.22320556640625, -0.19649505615234375, -0.1697845458984375, -0.14307403564453125, -0.116363525390625, -0.08965301513671875, -0.0629425048828125, -0.03623199462890625, -0.009521484375, 0.01718902587890625, 0.0438995361328125, 0.07061004638671875, 0.097320556640625, 0.12403106689453125, 0.1507415771484375, 0.17745208740234375, 0.20416259765625, 0.23087310791015625, 0.2575836181640625, 0.28429412841796875, 0.311004638671875, 0.33771514892578125, 0.3644256591796875, 0.39113616943359375, 0.4178466796875, 0.44455718994140625, 0.4712677001953125, 0.49797821044921875, 0.524688720703125, 0.5513992309570312, 0.5781097412109375, 0.6048202514648438, 0.63153076171875, 0.6582412719726562, 0.6849517822265625, 0.7116622924804688, 0.738372802734375, 0.7650833129882812, 0.7917938232421875, 0.8185043334960938, 0.84521484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 7.0, 9.0, 10.0, 14.0, 15.0, 8.0, 14.0, 23.0, 34.0, 32.0, 60.0, 65.0, 61.0, 107.0, 87.0, 90.0, 70.0, 61.0, 26.0, 32.0, 28.0, 22.0, 20.0, 12.0, 12.0, 14.0, 8.0, 1.0, 5.0, 9.0, 7.0, 8.0, 5.0, 1.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9130706787109375, -0.883758544921875, -0.8544464111328125, -0.82513427734375, -0.7958221435546875, -0.766510009765625, -0.7371978759765625, -0.7078857421875, -0.6785736083984375, -0.649261474609375, -0.6199493408203125, -0.59063720703125, -0.5613250732421875, -0.532012939453125, -0.5027008056640625, -0.473388671875, -0.4440765380859375, -0.414764404296875, -0.3854522705078125, -0.35614013671875, -0.3268280029296875, -0.297515869140625, -0.2682037353515625, -0.2388916015625, -0.2095794677734375, -0.180267333984375, -0.1509552001953125, -0.12164306640625, -0.0923309326171875, -0.063018798828125, -0.0337066650390625, -0.00439453125, 0.0249176025390625, 0.054229736328125, 0.0835418701171875, 0.11285400390625, 0.1421661376953125, 0.171478271484375, 0.2007904052734375, 0.2301025390625, 0.2594146728515625, 0.288726806640625, 0.3180389404296875, 0.34735107421875, 0.3766632080078125, 0.405975341796875, 0.4352874755859375, 0.464599609375, 0.4939117431640625, 0.523223876953125, 0.5525360107421875, 0.58184814453125, 0.6111602783203125, 0.640472412109375, 0.6697845458984375, 0.6990966796875, 0.7284088134765625, 0.757720947265625, 0.7870330810546875, 0.81634521484375, 0.8456573486328125, 0.874969482421875, 0.9042816162109375, 0.93359375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 8.0, 6.0, 32.0, 98.0, 235.0, 436.0, 125.0, 44.0, 13.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.7462158203125, -71.06510925292969, -69.38400268554688, -67.70289611816406, -66.02178955078125, -64.34068298339844, -62.659576416015625, -60.97846984863281, -59.29736328125, -57.61625671386719, -55.935150146484375, -54.25404357910156, -52.57293701171875, -50.89183044433594, -49.210723876953125, -47.52961730957031, -45.848514556884766, -44.16740798950195, -42.48630142211914, -40.80519485473633, -39.124088287353516, -37.4429817199707, -35.761878967285156, -34.080772399902344, -32.39966583251953, -30.71855926513672, -29.037452697753906, -27.356346130371094, -25.67523956298828, -23.99413299560547, -22.31302833557129, -20.631921768188477, -18.950809478759766, -17.269702911376953, -15.58859634399414, -13.907490730285645, -12.226384162902832, -10.54527759552002, -8.864171981811523, -7.183065414428711, -5.501958847045898, -3.820852518081665, -2.1397461891174316, -0.45864009857177734, 1.2224664688110352, 2.9035730361938477, 4.584678649902344, 6.265785217285156, 7.946891784667969, 9.627998352050781, 11.309104919433594, 12.99021053314209, 14.671317100524902, 16.35242462158203, 18.03352928161621, 19.714635848999023, 21.395742416381836, 23.07684898376465, 24.75795555114746, 26.43906021118164, 28.120166778564453, 29.801273345947266, 31.482379913330078, 33.16348648071289, 34.8445930480957]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 9.0, 10.0, 7.0, 8.0, 8.0, 8.0, 17.0, 15.0, 21.0, 18.0, 24.0, 20.0, 29.0, 38.0, 36.0, 36.0, 57.0, 78.0, 79.0, 82.0, 51.0, 27.0, 34.0, 31.0, 36.0, 22.0, 22.0, 21.0, 16.0, 17.0, 19.0, 11.0, 16.0, 14.0, 9.0, 7.0, 6.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.586380004882812, -19.02099609375, -18.455612182617188, -17.890228271484375, -17.324844360351562, -16.75946044921875, -16.194076538085938, -15.628693580627441, -15.063309669494629, -14.497925758361816, -13.932541847229004, -13.367157936096191, -12.801774978637695, -12.236391067504883, -11.67100715637207, -11.105623245239258, -10.540239334106445, -9.974855422973633, -9.40947151184082, -8.844087600708008, -8.278703689575195, -7.713320255279541, -7.147936820983887, -6.582552909851074, -6.017168998718262, -5.451785087585449, -4.886401176452637, -4.321017742156982, -3.75563383102417, -3.1902499198913574, -2.624866247177124, -2.0594825744628906, -1.4940986633300781, -0.9287148714065552, -0.3633310794830322, 0.20205271244049072, 0.7674365043640137, 1.3328204154968262, 1.8982040882110596, 2.463587760925293, 3.0289716720581055, 3.594355583190918, 4.1597394943237305, 4.725122928619385, 5.290506839752197, 5.85589075088501, 6.421274185180664, 6.986658096313477, 7.552042007446289, 8.117425918579102, 8.682809829711914, 9.248193740844727, 9.813577651977539, 10.378961563110352, 10.944344520568848, 11.50972843170166, 12.075112342834473, 12.640496253967285, 13.205880165100098, 13.77126407623291, 14.336647033691406, 14.902030944824219, 15.467414855957031, 16.032798767089844, 16.598182678222656]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 3.0, 7.0, 9.0, 12.0, 30.0, 24.0, 37.0, 74.0, 115.0, 118.0, 226.0, 344.0, 550.0, 967.0, 1677.0, 2992.0, 5797.0, 12573.0, 32298.0, 100127.0, 379982.0, 1376744.0, 1623772.0, 473419.0, 119078.0, 35896.0, 13466.0, 6291.0, 3196.0, 1721.0, 1028.0, 617.0, 393.0, 228.0, 151.0, 105.0, 68.0, 49.0, 32.0, 21.0, 17.0, 9.0, 11.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.427734375, -1.3832244873046875, -1.338714599609375, -1.2942047119140625, -1.24969482421875, -1.2051849365234375, -1.160675048828125, -1.1161651611328125, -1.0716552734375, -1.0271453857421875, -0.982635498046875, -0.9381256103515625, -0.89361572265625, -0.8491058349609375, -0.804595947265625, -0.7600860595703125, -0.715576171875, -0.6710662841796875, -0.626556396484375, -0.5820465087890625, -0.53753662109375, -0.4930267333984375, -0.448516845703125, -0.4040069580078125, -0.3594970703125, -0.3149871826171875, -0.270477294921875, -0.2259674072265625, -0.18145751953125, -0.1369476318359375, -0.092437744140625, -0.0479278564453125, -0.00341796875, 0.0410919189453125, 0.085601806640625, 0.1301116943359375, 0.17462158203125, 0.2191314697265625, 0.263641357421875, 0.3081512451171875, 0.3526611328125, 0.3971710205078125, 0.441680908203125, 0.4861907958984375, 0.53070068359375, 0.5752105712890625, 0.619720458984375, 0.6642303466796875, 0.708740234375, 0.7532501220703125, 0.797760009765625, 0.8422698974609375, 0.88677978515625, 0.9312896728515625, 0.975799560546875, 1.0203094482421875, 1.0648193359375, 1.1093292236328125, 1.153839111328125, 1.1983489990234375, 1.24285888671875, 1.2873687744140625, 1.331878662109375, 1.3763885498046875, 1.4208984375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 7.0, 6.0, 7.0, 13.0, 17.0, 17.0, 26.0, 21.0, 27.0, 23.0, 36.0, 48.0, 35.0, 50.0, 50.0, 48.0, 44.0, 55.0, 45.0, 31.0, 46.0, 34.0, 32.0, 51.0, 38.0, 20.0, 23.0, 27.0, 20.0, 17.0, 18.0, 11.0, 9.0, 6.0, 8.0, 4.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.265625, -1.2212066650390625, -1.176788330078125, -1.1323699951171875, -1.08795166015625, -1.0435333251953125, -0.999114990234375, -0.9546966552734375, -0.9102783203125, -0.8658599853515625, -0.821441650390625, -0.7770233154296875, -0.73260498046875, -0.6881866455078125, -0.643768310546875, -0.5993499755859375, -0.554931640625, -0.5105133056640625, -0.466094970703125, -0.4216766357421875, -0.37725830078125, -0.3328399658203125, -0.288421630859375, -0.2440032958984375, -0.1995849609375, -0.1551666259765625, -0.110748291015625, -0.0663299560546875, -0.02191162109375, 0.0225067138671875, 0.066925048828125, 0.1113433837890625, 0.15576171875, 0.2001800537109375, 0.244598388671875, 0.2890167236328125, 0.33343505859375, 0.3778533935546875, 0.422271728515625, 0.4666900634765625, 0.5111083984375, 0.5555267333984375, 0.599945068359375, 0.6443634033203125, 0.68878173828125, 0.7332000732421875, 0.777618408203125, 0.8220367431640625, 0.866455078125, 0.9108734130859375, 0.955291748046875, 0.9997100830078125, 1.04412841796875, 1.0885467529296875, 1.132965087890625, 1.1773834228515625, 1.2218017578125, 1.2662200927734375, 1.310638427734375, 1.3550567626953125, 1.39947509765625, 1.4438934326171875, 1.488311767578125, 1.5327301025390625, 1.5771484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 8.0, 9.0, 10.0, 13.0, 23.0, 42.0, 62.0, 99.0, 156.0, 307.0, 633.0, 1810.0, 6584.0, 43980.0, 1290650.0, 2766638.0, 70142.0, 9154.0, 2260.0, 806.0, 340.0, 211.0, 105.0, 70.0, 39.0, 35.0, 20.0, 21.0, 10.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.171875, -4.03326416015625, -3.8946533203125, -3.75604248046875, -3.617431640625, -3.47882080078125, -3.3402099609375, -3.20159912109375, -3.06298828125, -2.92437744140625, -2.7857666015625, -2.64715576171875, -2.508544921875, -2.36993408203125, -2.2313232421875, -2.09271240234375, -1.9541015625, -1.81549072265625, -1.6768798828125, -1.53826904296875, -1.399658203125, -1.26104736328125, -1.1224365234375, -0.98382568359375, -0.84521484375, -0.70660400390625, -0.5679931640625, -0.42938232421875, -0.290771484375, -0.15216064453125, -0.0135498046875, 0.12506103515625, 0.263671875, 0.40228271484375, 0.5408935546875, 0.67950439453125, 0.818115234375, 0.95672607421875, 1.0953369140625, 1.23394775390625, 1.37255859375, 1.51116943359375, 1.6497802734375, 1.78839111328125, 1.927001953125, 2.06561279296875, 2.2042236328125, 2.34283447265625, 2.4814453125, 2.62005615234375, 2.7586669921875, 2.89727783203125, 3.035888671875, 3.17449951171875, 3.3131103515625, 3.45172119140625, 3.59033203125, 3.72894287109375, 3.8675537109375, 4.00616455078125, 4.144775390625, 4.28338623046875, 4.4219970703125, 4.56060791015625, 4.69921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 8.0, 9.0, 8.0, 17.0, 18.0, 28.0, 34.0, 43.0, 72.0, 91.0, 143.0, 244.0, 384.0, 490.0, 658.0, 587.0, 425.0, 252.0, 187.0, 92.0, 72.0, 51.0, 42.0, 28.0, 21.0, 15.0, 12.0, 9.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.904296875, -2.80645751953125, -2.7086181640625, -2.61077880859375, -2.512939453125, -2.41510009765625, -2.3172607421875, -2.21942138671875, -2.12158203125, -2.02374267578125, -1.9259033203125, -1.82806396484375, -1.730224609375, -1.63238525390625, -1.5345458984375, -1.43670654296875, -1.3388671875, -1.24102783203125, -1.1431884765625, -1.04534912109375, -0.947509765625, -0.84967041015625, -0.7518310546875, -0.65399169921875, -0.55615234375, -0.45831298828125, -0.3604736328125, -0.26263427734375, -0.164794921875, -0.06695556640625, 0.0308837890625, 0.12872314453125, 0.2265625, 0.32440185546875, 0.4222412109375, 0.52008056640625, 0.617919921875, 0.71575927734375, 0.8135986328125, 0.91143798828125, 1.00927734375, 1.10711669921875, 1.2049560546875, 1.30279541015625, 1.400634765625, 1.49847412109375, 1.5963134765625, 1.69415283203125, 1.7919921875, 1.88983154296875, 1.9876708984375, 2.08551025390625, 2.183349609375, 2.28118896484375, 2.3790283203125, 2.47686767578125, 2.57470703125, 2.67254638671875, 2.7703857421875, 2.86822509765625, 2.966064453125, 3.06390380859375, 3.1617431640625, 3.25958251953125, 3.357421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 10.0, 7.0, 23.0, 41.0, 78.0, 166.0, 235.0, 189.0, 121.0, 68.0, 31.0, 12.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.62327003479004, -25.504671096801758, -24.386072158813477, -23.267473220825195, -22.148874282836914, -21.030275344848633, -19.91167449951172, -18.793075561523438, -17.674476623535156, -16.555877685546875, -15.437278747558594, -14.318679809570312, -13.200080871582031, -12.08148193359375, -10.962882041931152, -9.844283103942871, -8.725685119628906, -7.607086181640625, -6.488487243652344, -5.369887828826904, -4.251288890838623, -3.132689952850342, -2.0140905380249023, -0.8954916000366211, 0.22310733795166016, 1.341706395149231, 2.4603054523468018, 3.578904628753662, 4.697503566741943, 5.816102504730225, 6.934701919555664, 8.053300857543945, 9.171897888183594, 10.290496826171875, 11.409095764160156, 12.527694702148438, 13.646293640136719, 14.764892578125, 15.883492469787598, 17.002090454101562, 18.120689392089844, 19.239288330078125, 20.357887268066406, 21.476486206054688, 22.59508514404297, 23.71368408203125, 24.83228302001953, 25.950881958007812, 27.069482803344727, 28.188081741333008, 29.30668067932129, 30.42527961730957, 31.54387855529785, 32.662479400634766, 33.78107833862305, 34.89967727661133, 36.01827621459961, 37.13687515258789, 38.25547409057617, 39.37407302856445, 40.492671966552734, 41.611270904541016, 42.7298698425293, 43.84846878051758, 44.96706771850586]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 2.0, 3.0, 8.0, 7.0, 14.0, 16.0, 14.0, 19.0, 24.0, 25.0, 26.0, 27.0, 31.0, 49.0, 56.0, 51.0, 55.0, 58.0, 63.0, 68.0, 57.0, 48.0, 40.0, 40.0, 33.0, 33.0, 30.0, 24.0, 15.0, 18.0, 10.0, 7.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.758098602294922, -17.23614501953125, -16.71419334411621, -16.192241668701172, -15.6702880859375, -15.148335456848145, -14.626382827758789, -14.104430198669434, -13.582477569580078, -13.060524940490723, -12.538572311401367, -12.016619682312012, -11.494667053222656, -10.9727144241333, -10.450761795043945, -9.92880916595459, -9.406856536865234, -8.884903907775879, -8.362951278686523, -7.840998649597168, -7.3190460205078125, -6.797093391418457, -6.275140762329102, -5.753188133239746, -5.231235504150391, -4.709282875061035, -4.18733024597168, -3.665377616882324, -3.1434249877929688, -2.6214723587036133, -2.099519729614258, -1.5775671005249023, -1.0556135177612305, -0.533660888671875, -0.011708259582519531, 0.5102443695068359, 1.0321969985961914, 1.5541496276855469, 2.0761022567749023, 2.598054885864258, 3.1200075149536133, 3.6419601440429688, 4.163912773132324, 4.68586540222168, 5.207818031311035, 5.729770660400391, 6.251723289489746, 6.773675918579102, 7.295628547668457, 7.8175811767578125, 8.339533805847168, 8.861486434936523, 9.383439064025879, 9.905391693115234, 10.42734432220459, 10.949296951293945, 11.4712495803833, 11.993202209472656, 12.515154838562012, 13.037107467651367, 13.559060096740723, 14.081012725830078, 14.602965354919434, 15.124917984008789, 15.646870613098145]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 13.0, 23.0, 37.0, 42.0, 87.0, 106.0, 207.0, 322.0, 544.0, 954.0, 1706.0, 3124.0, 6114.0, 12372.0, 26622.0, 61524.0, 152858.0, 336855.0, 260089.0, 103394.0, 43077.0, 19143.0, 9007.0, 4582.0, 2453.0, 1380.0, 789.0, 436.0, 275.0, 156.0, 91.0, 63.0, 41.0, 27.0, 16.0, 10.0, 8.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7255859375, -1.6634979248046875, -1.601409912109375, -1.5393218994140625, -1.47723388671875, -1.4151458740234375, -1.353057861328125, -1.2909698486328125, -1.2288818359375, -1.1667938232421875, -1.104705810546875, -1.0426177978515625, -0.98052978515625, -0.9184417724609375, -0.856353759765625, -0.7942657470703125, -0.732177734375, -0.6700897216796875, -0.608001708984375, -0.5459136962890625, -0.48382568359375, -0.4217376708984375, -0.359649658203125, -0.2975616455078125, -0.2354736328125, -0.1733856201171875, -0.111297607421875, -0.0492095947265625, 0.01287841796875, 0.0749664306640625, 0.137054443359375, 0.1991424560546875, 0.26123046875, 0.3233184814453125, 0.385406494140625, 0.4474945068359375, 0.50958251953125, 0.5716705322265625, 0.633758544921875, 0.6958465576171875, 0.7579345703125, 0.8200225830078125, 0.882110595703125, 0.9441986083984375, 1.00628662109375, 1.0683746337890625, 1.130462646484375, 1.1925506591796875, 1.254638671875, 1.3167266845703125, 1.378814697265625, 1.4409027099609375, 1.50299072265625, 1.5650787353515625, 1.627166748046875, 1.6892547607421875, 1.7513427734375, 1.8134307861328125, 1.875518798828125, 1.9376068115234375, 1.99969482421875, 2.0617828369140625, 2.123870849609375, 2.1859588623046875, 2.248046875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 9.0, 7.0, 11.0, 6.0, 12.0, 16.0, 24.0, 22.0, 25.0, 25.0, 30.0, 34.0, 41.0, 44.0, 46.0, 59.0, 64.0, 53.0, 47.0, 58.0, 48.0, 41.0, 38.0, 32.0, 35.0, 29.0, 22.0, 27.0, 15.0, 19.0, 11.0, 9.0, 8.0, 7.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5947265625, -1.545379638671875, -1.49603271484375, -1.446685791015625, -1.3973388671875, -1.347991943359375, -1.29864501953125, -1.249298095703125, -1.199951171875, -1.150604248046875, -1.10125732421875, -1.051910400390625, -1.0025634765625, -0.953216552734375, -0.90386962890625, -0.854522705078125, -0.80517578125, -0.755828857421875, -0.70648193359375, -0.657135009765625, -0.6077880859375, -0.558441162109375, -0.50909423828125, -0.459747314453125, -0.410400390625, -0.361053466796875, -0.31170654296875, -0.262359619140625, -0.2130126953125, -0.163665771484375, -0.11431884765625, -0.064971923828125, -0.015625, 0.033721923828125, 0.08306884765625, 0.132415771484375, 0.1817626953125, 0.231109619140625, 0.28045654296875, 0.329803466796875, 0.379150390625, 0.428497314453125, 0.47784423828125, 0.527191162109375, 0.5765380859375, 0.625885009765625, 0.67523193359375, 0.724578857421875, 0.77392578125, 0.823272705078125, 0.87261962890625, 0.921966552734375, 0.9713134765625, 1.020660400390625, 1.07000732421875, 1.119354248046875, 1.168701171875, 1.218048095703125, 1.26739501953125, 1.316741943359375, 1.3660888671875, 1.415435791015625, 1.46478271484375, 1.514129638671875, 1.5634765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 13.0, 15.0, 13.0, 22.0, 33.0, 40.0, 67.0, 91.0, 136.0, 157.0, 232.0, 386.0, 594.0, 1037.0, 2234.0, 5914.0, 27791.0, 259635.0, 691972.0, 44079.0, 8200.0, 2670.0, 1226.0, 659.0, 445.0, 273.0, 175.0, 136.0, 84.0, 66.0, 49.0, 32.0, 18.0, 16.0, 10.0, 6.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.3505859375, -4.201171875, -4.0517578125, -3.90234375, -3.7529296875, -3.603515625, -3.4541015625, -3.3046875, -3.1552734375, -3.005859375, -2.8564453125, -2.70703125, -2.5576171875, -2.408203125, -2.2587890625, -2.109375, -1.9599609375, -1.810546875, -1.6611328125, -1.51171875, -1.3623046875, -1.212890625, -1.0634765625, -0.9140625, -0.7646484375, -0.615234375, -0.4658203125, -0.31640625, -0.1669921875, -0.017578125, 0.1318359375, 0.28125, 0.4306640625, 0.580078125, 0.7294921875, 0.87890625, 1.0283203125, 1.177734375, 1.3271484375, 1.4765625, 1.6259765625, 1.775390625, 1.9248046875, 2.07421875, 2.2236328125, 2.373046875, 2.5224609375, 2.671875, 2.8212890625, 2.970703125, 3.1201171875, 3.26953125, 3.4189453125, 3.568359375, 3.7177734375, 3.8671875, 4.0166015625, 4.166015625, 4.3154296875, 4.46484375, 4.6142578125, 4.763671875, 4.9130859375, 5.0625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 7.0, 13.0, 4.0, 12.0, 10.0, 15.0, 11.0, 23.0, 22.0, 25.0, 37.0, 42.0, 38.0, 31.0, 51.0, 43.0, 52.0, 48.0, 51.0, 43.0, 58.0, 58.0, 39.0, 44.0, 35.0, 33.0, 26.0, 22.0, 15.0, 16.0, 12.0, 12.0, 13.0, 5.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2763671875, -5.099609375, -4.9228515625, -4.74609375, -4.5693359375, -4.392578125, -4.2158203125, -4.0390625, -3.8623046875, -3.685546875, -3.5087890625, -3.33203125, -3.1552734375, -2.978515625, -2.8017578125, -2.625, -2.4482421875, -2.271484375, -2.0947265625, -1.91796875, -1.7412109375, -1.564453125, -1.3876953125, -1.2109375, -1.0341796875, -0.857421875, -0.6806640625, -0.50390625, -0.3271484375, -0.150390625, 0.0263671875, 0.203125, 0.3798828125, 0.556640625, 0.7333984375, 0.91015625, 1.0869140625, 1.263671875, 1.4404296875, 1.6171875, 1.7939453125, 1.970703125, 2.1474609375, 2.32421875, 2.5009765625, 2.677734375, 2.8544921875, 3.03125, 3.2080078125, 3.384765625, 3.5615234375, 3.73828125, 3.9150390625, 4.091796875, 4.2685546875, 4.4453125, 4.6220703125, 4.798828125, 4.9755859375, 5.15234375, 5.3291015625, 5.505859375, 5.6826171875, 5.859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 14.0, 8.0, 14.0, 13.0, 16.0, 24.0, 25.0, 36.0, 49.0, 63.0, 89.0, 137.0, 217.0, 360.0, 620.0, 1129.0, 2405.0, 5864.0, 18333.0, 100814.0, 803441.0, 87452.0, 17090.0, 5459.0, 2211.0, 1070.0, 571.0, 336.0, 198.0, 136.0, 89.0, 67.0, 43.0, 26.0, 19.0, 22.0, 14.0, 10.0, 9.0, 12.0, 8.0, 11.0, 4.0, 6.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.9658203125, -0.9351272583007812, -0.9044342041015625, -0.8737411499023438, -0.843048095703125, -0.8123550415039062, -0.7816619873046875, -0.7509689331054688, -0.72027587890625, -0.6895828247070312, -0.6588897705078125, -0.6281967163085938, -0.597503662109375, -0.5668106079101562, -0.5361175537109375, -0.5054244995117188, -0.4747314453125, -0.44403839111328125, -0.4133453369140625, -0.38265228271484375, -0.351959228515625, -0.32126617431640625, -0.2905731201171875, -0.25988006591796875, -0.22918701171875, -0.19849395751953125, -0.1678009033203125, -0.13710784912109375, -0.106414794921875, -0.07572174072265625, -0.0450286865234375, -0.01433563232421875, 0.016357421875, 0.04705047607421875, 0.0777435302734375, 0.10843658447265625, 0.139129638671875, 0.16982269287109375, 0.2005157470703125, 0.23120880126953125, 0.26190185546875, 0.29259490966796875, 0.3232879638671875, 0.35398101806640625, 0.384674072265625, 0.41536712646484375, 0.4460601806640625, 0.47675323486328125, 0.5074462890625, 0.5381393432617188, 0.5688323974609375, 0.5995254516601562, 0.630218505859375, 0.6609115600585938, 0.6916046142578125, 0.7222976684570312, 0.75299072265625, 0.7836837768554688, 0.8143768310546875, 0.8450698852539062, 0.875762939453125, 0.9064559936523438, 0.9371490478515625, 0.9678421020507812, 0.99853515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 6.0, 1.0, 10.0, 6.0, 14.0, 11.0, 21.0, 33.0, 65.0, 99.0, 185.0, 234.0, 119.0, 70.0, 40.0, 21.0, 18.0, 12.0, 5.0, 6.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005102157592773438, -0.0004960782825946808, -0.0004819408059120178, -0.00046780332922935486, -0.0004536658525466919, -0.00043952837586402893, -0.00042539089918136597, -0.000411253422498703, -0.00039711594581604004, -0.0003829784691333771, -0.0003688409924507141, -0.00035470351576805115, -0.0003405660390853882, -0.0003264285624027252, -0.00031229108572006226, -0.0002981536090373993, -0.00028401613235473633, -0.00026987865567207336, -0.0002557411789894104, -0.00024160370230674744, -0.00022746622562408447, -0.0002133287489414215, -0.00019919127225875854, -0.00018505379557609558, -0.00017091631889343262, -0.00015677884221076965, -0.0001426413655281067, -0.00012850388884544373, -0.00011436641216278076, -0.0001002289354801178, -8.609145879745483e-05, -7.195398211479187e-05, -5.7816505432128906e-05, -4.367902874946594e-05, -2.954155206680298e-05, -1.5404075384140015e-05, -1.2665987014770508e-06, 1.2870877981185913e-05, 2.7008354663848877e-05, 4.114583134651184e-05, 5.5283308029174805e-05, 6.942078471183777e-05, 8.355826139450073e-05, 9.76957380771637e-05, 0.00011183321475982666, 0.00012597069144248962, 0.0001401081681251526, 0.00015424564480781555, 0.00016838312149047852, 0.00018252059817314148, 0.00019665807485580444, 0.0002107955515384674, 0.00022493302822113037, 0.00023907050490379333, 0.0002532079815864563, 0.00026734545826911926, 0.0002814829349517822, 0.0002956204116344452, 0.00030975788831710815, 0.0003238953649997711, 0.0003380328416824341, 0.00035217031836509705, 0.00036630779504776, 0.000380445271730423, 0.00039458274841308594]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 6.0, 13.0, 11.0, 8.0, 18.0, 28.0, 36.0, 50.0, 78.0, 128.0, 207.0, 395.0, 624.0, 1321.0, 2905.0, 8016.0, 30065.0, 205953.0, 718225.0, 59230.0, 13203.0, 4304.0, 1711.0, 857.0, 457.0, 231.0, 169.0, 98.0, 75.0, 36.0, 29.0, 22.0, 8.0, 13.0, 10.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9812469482421875, -0.949798583984375, -0.9183502197265625, -0.88690185546875, -0.8554534912109375, -0.824005126953125, -0.7925567626953125, -0.7611083984375, -0.7296600341796875, -0.698211669921875, -0.6667633056640625, -0.63531494140625, -0.6038665771484375, -0.572418212890625, -0.5409698486328125, -0.509521484375, -0.4780731201171875, -0.446624755859375, -0.4151763916015625, -0.38372802734375, -0.3522796630859375, -0.320831298828125, -0.2893829345703125, -0.2579345703125, -0.2264862060546875, -0.195037841796875, -0.1635894775390625, -0.13214111328125, -0.1006927490234375, -0.069244384765625, -0.0377960205078125, -0.00634765625, 0.0251007080078125, 0.056549072265625, 0.0879974365234375, 0.11944580078125, 0.1508941650390625, 0.182342529296875, 0.2137908935546875, 0.2452392578125, 0.2766876220703125, 0.308135986328125, 0.3395843505859375, 0.37103271484375, 0.4024810791015625, 0.433929443359375, 0.4653778076171875, 0.496826171875, 0.5282745361328125, 0.559722900390625, 0.5911712646484375, 0.62261962890625, 0.6540679931640625, 0.685516357421875, 0.7169647216796875, 0.7484130859375, 0.7798614501953125, 0.811309814453125, 0.8427581787109375, 0.87420654296875, 0.9056549072265625, 0.937103271484375, 0.9685516357421875, 1.0]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 14.0, 8.0, 8.0, 11.0, 18.0, 19.0, 27.0, 27.0, 33.0, 54.0, 71.0, 74.0, 87.0, 111.0, 98.0, 81.0, 42.0, 47.0, 30.0, 31.0, 18.0, 13.0, 13.0, 15.0, 14.0, 3.0, 5.0, 2.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.90673828125, -0.8785171508789062, -0.8502960205078125, -0.8220748901367188, -0.793853759765625, -0.7656326293945312, -0.7374114990234375, -0.7091903686523438, -0.68096923828125, -0.6527481079101562, -0.6245269775390625, -0.5963058471679688, -0.568084716796875, -0.5398635864257812, -0.5116424560546875, -0.48342132568359375, -0.4552001953125, -0.42697906494140625, -0.3987579345703125, -0.37053680419921875, -0.342315673828125, -0.31409454345703125, -0.2858734130859375, -0.25765228271484375, -0.22943115234375, -0.20121002197265625, -0.1729888916015625, -0.14476776123046875, -0.116546630859375, -0.08832550048828125, -0.0601043701171875, -0.03188323974609375, -0.003662109375, 0.02455902099609375, 0.0527801513671875, 0.08100128173828125, 0.109222412109375, 0.13744354248046875, 0.1656646728515625, 0.19388580322265625, 0.22210693359375, 0.25032806396484375, 0.2785491943359375, 0.30677032470703125, 0.334991455078125, 0.36321258544921875, 0.3914337158203125, 0.41965484619140625, 0.4478759765625, 0.47609710693359375, 0.5043182373046875, 0.5325393676757812, 0.560760498046875, 0.5889816284179688, 0.6172027587890625, 0.6454238891601562, 0.67364501953125, 0.7018661499023438, 0.7300872802734375, 0.7583084106445312, 0.786529541015625, 0.8147506713867188, 0.8429718017578125, 0.8711929321289062, 0.8994140625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 6.0, 26.0, 66.0, 189.0, 484.0, 152.0, 42.0, 14.0, 10.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.89264678955078, -54.26520538330078, -52.63776397705078, -51.01032257080078, -49.38288116455078, -47.75543975830078, -46.12799835205078, -44.50055694580078, -42.87311553955078, -41.24567413330078, -39.61823272705078, -37.99079132080078, -36.36334991455078, -34.73590850830078, -33.10846710205078, -31.48102378845215, -29.853580474853516, -28.226139068603516, -26.598697662353516, -24.971256256103516, -23.343814849853516, -21.716373443603516, -20.088930130004883, -18.461488723754883, -16.834047317504883, -15.206605911254883, -13.579164505004883, -11.951722145080566, -10.324280738830566, -8.696839332580566, -7.06939697265625, -5.44195556640625, -3.81451416015625, -2.187072515487671, -0.5596308708190918, 1.0678110122680664, 2.6952524185180664, 4.322693824768066, 5.950136184692383, 7.577577590942383, 9.205018997192383, 10.832460403442383, 12.459901809692383, 14.0873441696167, 15.7147855758667, 17.342227935791016, 18.969669342041016, 20.597110748291016, 22.224552154541016, 23.851993560791016, 25.479434967041016, 27.106876373291016, 28.734317779541016, 30.361759185791016, 31.98920249938965, 33.61664581298828, 35.24408721923828, 36.87152862548828, 38.49897003173828, 40.12641143798828, 41.75385284423828, 43.38129425048828, 45.00873565673828, 46.63617706298828, 48.26361846923828]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 3.0, 12.0, 17.0, 14.0, 18.0, 14.0, 19.0, 14.0, 24.0, 20.0, 30.0, 29.0, 25.0, 44.0, 71.0, 129.0, 140.0, 65.0, 40.0, 28.0, 28.0, 29.0, 29.0, 25.0, 19.0, 21.0, 12.0, 13.0, 13.0, 11.0, 8.0, 2.0, 5.0, 5.0, 10.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.746797561645508, -22.081905364990234, -21.417015075683594, -20.75212287902832, -20.087230682373047, -19.422338485717773, -18.757448196411133, -18.09255599975586, -17.427663803100586, -16.762771606445312, -16.097881317138672, -15.432989120483398, -14.768096923828125, -14.103205680847168, -13.438314437866211, -12.773422241210938, -12.10853099822998, -11.443639755249023, -10.77874755859375, -10.113856315612793, -9.44896411895752, -8.784072875976562, -8.119180679321289, -7.454289436340332, -6.789397716522217, -6.124505996704102, -5.459614276885986, -4.794722557067871, -4.129831314086914, -3.4649393558502197, -2.8000478744506836, -2.1351561546325684, -1.4702644348144531, -0.8053727746009827, -0.1404811143875122, 0.5244104862213135, 1.1893022060394287, 1.854193925857544, 2.51908540725708, 3.1839771270751953, 3.8488688468933105, 4.513760566711426, 5.178652286529541, 5.843544006347656, 6.508435249328613, 7.173327445983887, 7.838218688964844, 8.503110885620117, 9.168002128601074, 9.832893371582031, 10.497785568237305, 11.162676811218262, 11.827569007873535, 12.492460250854492, 13.157352447509766, 13.822243690490723, 14.48713493347168, 15.152026176452637, 15.81691837310791, 16.481809616088867, 17.14670181274414, 17.811594009399414, 18.476484298706055, 19.141376495361328, 19.8062686920166]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 9.0, 8.0, 14.0, 15.0, 31.0, 54.0, 66.0, 122.0, 184.0, 288.0, 413.0, 698.0, 1301.0, 2582.0, 5823.0, 17117.0, 71135.0, 431678.0, 1988048.0, 1366930.0, 244886.0, 42257.0, 11644.0, 4317.0, 2004.0, 979.0, 585.0, 390.0, 234.0, 130.0, 102.0, 77.0, 51.0, 31.0, 26.0, 14.0, 13.0, 7.0, 10.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.404296875, -2.32879638671875, -2.2532958984375, -2.17779541015625, -2.102294921875, -2.02679443359375, -1.9512939453125, -1.87579345703125, -1.80029296875, -1.72479248046875, -1.6492919921875, -1.57379150390625, -1.498291015625, -1.42279052734375, -1.3472900390625, -1.27178955078125, -1.1962890625, -1.12078857421875, -1.0452880859375, -0.96978759765625, -0.894287109375, -0.81878662109375, -0.7432861328125, -0.66778564453125, -0.59228515625, -0.51678466796875, -0.4412841796875, -0.36578369140625, -0.290283203125, -0.21478271484375, -0.1392822265625, -0.06378173828125, 0.01171875, 0.08721923828125, 0.1627197265625, 0.23822021484375, 0.313720703125, 0.38922119140625, 0.4647216796875, 0.54022216796875, 0.61572265625, 0.69122314453125, 0.7667236328125, 0.84222412109375, 0.917724609375, 0.99322509765625, 1.0687255859375, 1.14422607421875, 1.2197265625, 1.29522705078125, 1.3707275390625, 1.44622802734375, 1.521728515625, 1.59722900390625, 1.6727294921875, 1.74822998046875, 1.82373046875, 1.89923095703125, 1.9747314453125, 2.05023193359375, 2.125732421875, 2.20123291015625, 2.2767333984375, 2.35223388671875, 2.427734375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 2.0, 8.0, 15.0, 7.0, 21.0, 9.0, 21.0, 20.0, 31.0, 24.0, 31.0, 35.0, 37.0, 39.0, 58.0, 37.0, 52.0, 52.0, 56.0, 57.0, 51.0, 55.0, 41.0, 35.0, 22.0, 41.0, 24.0, 24.0, 15.0, 10.0, 17.0, 17.0, 9.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.494140625, -1.446868896484375, -1.39959716796875, -1.352325439453125, -1.3050537109375, -1.257781982421875, -1.21051025390625, -1.163238525390625, -1.115966796875, -1.068695068359375, -1.02142333984375, -0.974151611328125, -0.9268798828125, -0.879608154296875, -0.83233642578125, -0.785064697265625, -0.73779296875, -0.690521240234375, -0.64324951171875, -0.595977783203125, -0.5487060546875, -0.501434326171875, -0.45416259765625, -0.406890869140625, -0.359619140625, -0.312347412109375, -0.26507568359375, -0.217803955078125, -0.1705322265625, -0.123260498046875, -0.07598876953125, -0.028717041015625, 0.0185546875, 0.065826416015625, 0.11309814453125, 0.160369873046875, 0.2076416015625, 0.254913330078125, 0.30218505859375, 0.349456787109375, 0.396728515625, 0.444000244140625, 0.49127197265625, 0.538543701171875, 0.5858154296875, 0.633087158203125, 0.68035888671875, 0.727630615234375, 0.77490234375, 0.822174072265625, 0.86944580078125, 0.916717529296875, 0.9639892578125, 1.011260986328125, 1.05853271484375, 1.105804443359375, 1.153076171875, 1.200347900390625, 1.24761962890625, 1.294891357421875, 1.3421630859375, 1.389434814453125, 1.43670654296875, 1.483978271484375, 1.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 1.0, 5.0, 3.0, 8.0, 19.0, 27.0, 28.0, 54.0, 78.0, 136.0, 184.0, 248.0, 496.0, 891.0, 1831.0, 5546.0, 33326.0, 2261669.0, 1850124.0, 30638.0, 5081.0, 1783.0, 854.0, 458.0, 269.0, 170.0, 107.0, 80.0, 46.0, 22.0, 15.0, 30.0, 10.0, 10.0, 8.0, 7.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.50390625, -7.301025390625, -7.09814453125, -6.895263671875, -6.6923828125, -6.489501953125, -6.28662109375, -6.083740234375, -5.880859375, -5.677978515625, -5.47509765625, -5.272216796875, -5.0693359375, -4.866455078125, -4.66357421875, -4.460693359375, -4.2578125, -4.054931640625, -3.85205078125, -3.649169921875, -3.4462890625, -3.243408203125, -3.04052734375, -2.837646484375, -2.634765625, -2.431884765625, -2.22900390625, -2.026123046875, -1.8232421875, -1.620361328125, -1.41748046875, -1.214599609375, -1.01171875, -0.808837890625, -0.60595703125, -0.403076171875, -0.2001953125, 0.002685546875, 0.20556640625, 0.408447265625, 0.611328125, 0.814208984375, 1.01708984375, 1.219970703125, 1.4228515625, 1.625732421875, 1.82861328125, 2.031494140625, 2.234375, 2.437255859375, 2.64013671875, 2.843017578125, 3.0458984375, 3.248779296875, 3.45166015625, 3.654541015625, 3.857421875, 4.060302734375, 4.26318359375, 4.466064453125, 4.6689453125, 4.871826171875, 5.07470703125, 5.277587890625, 5.48046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 9.0, 11.0, 30.0, 14.0, 28.0, 48.0, 52.0, 83.0, 127.0, 168.0, 290.0, 479.0, 652.0, 676.0, 473.0, 305.0, 181.0, 142.0, 98.0, 74.0, 35.0, 25.0, 22.0, 15.0, 9.0, 6.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1953125, -5.0474853515625, -4.899658203125, -4.7518310546875, -4.60400390625, -4.4561767578125, -4.308349609375, -4.1605224609375, -4.0126953125, -3.8648681640625, -3.717041015625, -3.5692138671875, -3.42138671875, -3.2735595703125, -3.125732421875, -2.9779052734375, -2.830078125, -2.6822509765625, -2.534423828125, -2.3865966796875, -2.23876953125, -2.0909423828125, -1.943115234375, -1.7952880859375, -1.6474609375, -1.4996337890625, -1.351806640625, -1.2039794921875, -1.05615234375, -0.9083251953125, -0.760498046875, -0.6126708984375, -0.46484375, -0.3170166015625, -0.169189453125, -0.0213623046875, 0.12646484375, 0.2742919921875, 0.422119140625, 0.5699462890625, 0.7177734375, 0.8656005859375, 1.013427734375, 1.1612548828125, 1.30908203125, 1.4569091796875, 1.604736328125, 1.7525634765625, 1.900390625, 2.0482177734375, 2.196044921875, 2.3438720703125, 2.49169921875, 2.6395263671875, 2.787353515625, 2.9351806640625, 3.0830078125, 3.2308349609375, 3.378662109375, 3.5264892578125, 3.67431640625, 3.8221435546875, 3.969970703125, 4.1177978515625, 4.265625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 4.0, 14.0, 13.0, 26.0, 50.0, 73.0, 158.0, 195.0, 179.0, 127.0, 61.0, 35.0, 15.0, 12.0, 10.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.82004165649414, -52.127037048339844, -50.43403244018555, -48.74102783203125, -47.04801940917969, -45.35501480102539, -43.662010192871094, -41.9690055847168, -40.2760009765625, -38.5829963684082, -36.889991760253906, -35.196983337402344, -33.50397872924805, -31.81097412109375, -30.117969512939453, -28.424964904785156, -26.731956481933594, -25.038951873779297, -23.345945358276367, -21.65294075012207, -19.95993423461914, -18.266929626464844, -16.573925018310547, -14.880919456481934, -13.18791389465332, -11.494908332824707, -9.801902770996094, -8.108898162841797, -6.415892601013184, -4.72288703918457, -3.0298824310302734, -1.3368768692016602, 0.35613250732421875, 2.049137830734253, 3.742143154144287, 5.435148239135742, 7.1281538009643555, 8.821159362792969, 10.514163970947266, 12.207169532775879, 13.900175094604492, 15.593180656433105, 17.28618621826172, 18.979190826416016, 20.672195434570312, 22.365201950073242, 24.05820655822754, 25.75121307373047, 27.444217681884766, 29.137222290039062, 30.830228805541992, 32.523231506347656, 34.21623992919922, 35.909244537353516, 37.60224914550781, 39.29525375366211, 40.988258361816406, 42.6812629699707, 44.374267578125, 46.06727600097656, 47.76028060913086, 49.453285217285156, 51.14628982543945, 52.83929443359375, 54.53230285644531]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 5.0, 10.0, 10.0, 11.0, 14.0, 20.0, 23.0, 27.0, 25.0, 21.0, 22.0, 34.0, 31.0, 54.0, 43.0, 47.0, 56.0, 41.0, 51.0, 58.0, 56.0, 41.0, 41.0, 30.0, 27.0, 23.0, 23.0, 18.0, 29.0, 9.0, 13.0, 13.0, 12.0, 5.0, 7.0, 8.0, 5.0, 5.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.02021026611328, -17.3231201171875, -16.626028060913086, -15.928937911987305, -15.231846809387207, -14.53475570678711, -13.837665557861328, -13.14057445526123, -12.443483352661133, -11.746392250061035, -11.049301147460938, -10.352210998535156, -9.655119895935059, -8.958028793334961, -8.26093864440918, -7.563847541809082, -6.866756439208984, -6.169665336608887, -5.472574710845947, -4.775484085083008, -4.07839298248291, -3.3813021183013916, -2.684211254119873, -1.9871206283569336, -1.290029525756836, -0.5929386615753174, 0.10415220260620117, 0.8012430667877197, 1.4983339309692383, 2.195424795150757, 2.8925156593322754, 3.589606285095215, 4.2866973876953125, 4.98378849029541, 5.68087911605835, 6.377969741821289, 7.075060844421387, 7.772151947021484, 8.469242095947266, 9.166333198547363, 9.863424301147461, 10.560515403747559, 11.257606506347656, 11.954696655273438, 12.651787757873535, 13.348878860473633, 14.045969009399414, 14.743060111999512, 15.44015121459961, 16.13724136352539, 16.834333419799805, 17.531423568725586, 18.228515625, 18.92560577392578, 19.622695922851562, 20.319786071777344, 21.016878128051758, 21.71396827697754, 22.411060333251953, 23.108150482177734, 23.805240631103516, 24.50233268737793, 25.19942283630371, 25.896514892578125, 26.593605041503906]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 12.0, 17.0, 27.0, 27.0, 50.0, 78.0, 133.0, 203.0, 311.0, 548.0, 944.0, 1706.0, 3281.0, 6772.0, 15385.0, 39900.0, 124656.0, 469070.0, 264949.0, 73905.0, 25455.0, 10606.0, 4853.0, 2465.0, 1266.0, 753.0, 432.0, 256.0, 170.0, 104.0, 67.0, 43.0, 32.0, 21.0, 21.0, 8.0, 6.0, 3.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9609375, -1.890350341796875, -1.81976318359375, -1.749176025390625, -1.6785888671875, -1.608001708984375, -1.53741455078125, -1.466827392578125, -1.396240234375, -1.325653076171875, -1.25506591796875, -1.184478759765625, -1.1138916015625, -1.043304443359375, -0.97271728515625, -0.902130126953125, -0.83154296875, -0.760955810546875, -0.69036865234375, -0.619781494140625, -0.5491943359375, -0.478607177734375, -0.40802001953125, -0.337432861328125, -0.266845703125, -0.196258544921875, -0.12567138671875, -0.055084228515625, 0.0155029296875, 0.086090087890625, 0.15667724609375, 0.227264404296875, 0.2978515625, 0.368438720703125, 0.43902587890625, 0.509613037109375, 0.5802001953125, 0.650787353515625, 0.72137451171875, 0.791961669921875, 0.862548828125, 0.933135986328125, 1.00372314453125, 1.074310302734375, 1.1448974609375, 1.215484619140625, 1.28607177734375, 1.356658935546875, 1.42724609375, 1.497833251953125, 1.56842041015625, 1.639007568359375, 1.7095947265625, 1.780181884765625, 1.85076904296875, 1.921356201171875, 1.991943359375, 2.062530517578125, 2.13311767578125, 2.203704833984375, 2.2742919921875, 2.344879150390625, 2.41546630859375, 2.486053466796875, 2.556640625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 11.0, 12.0, 15.0, 14.0, 22.0, 24.0, 34.0, 35.0, 35.0, 56.0, 58.0, 53.0, 66.0, 66.0, 60.0, 71.0, 54.0, 65.0, 41.0, 38.0, 34.0, 28.0, 26.0, 22.0, 15.0, 17.0, 10.0, 7.0, 9.0, 6.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.94140625, -1.87445068359375, -1.8074951171875, -1.74053955078125, -1.673583984375, -1.60662841796875, -1.5396728515625, -1.47271728515625, -1.40576171875, -1.33880615234375, -1.2718505859375, -1.20489501953125, -1.137939453125, -1.07098388671875, -1.0040283203125, -0.93707275390625, -0.8701171875, -0.80316162109375, -0.7362060546875, -0.66925048828125, -0.602294921875, -0.53533935546875, -0.4683837890625, -0.40142822265625, -0.33447265625, -0.26751708984375, -0.2005615234375, -0.13360595703125, -0.066650390625, 0.00030517578125, 0.0672607421875, 0.13421630859375, 0.201171875, 0.26812744140625, 0.3350830078125, 0.40203857421875, 0.468994140625, 0.53594970703125, 0.6029052734375, 0.66986083984375, 0.73681640625, 0.80377197265625, 0.8707275390625, 0.93768310546875, 1.004638671875, 1.07159423828125, 1.1385498046875, 1.20550537109375, 1.2724609375, 1.33941650390625, 1.4063720703125, 1.47332763671875, 1.540283203125, 1.60723876953125, 1.6741943359375, 1.74114990234375, 1.80810546875, 1.87506103515625, 1.9420166015625, 2.00897216796875, 2.075927734375, 2.14288330078125, 2.2098388671875, 2.27679443359375, 2.34375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 0.0, 3.0, 4.0, 5.0, 12.0, 7.0, 18.0, 21.0, 22.0, 30.0, 27.0, 48.0, 61.0, 100.0, 137.0, 272.0, 413.0, 940.0, 2727.0, 12085.0, 145577.0, 839007.0, 38117.0, 5751.0, 1583.0, 650.0, 356.0, 184.0, 114.0, 95.0, 53.0, 40.0, 27.0, 23.0, 11.0, 7.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.697265625, -3.57904052734375, -3.4608154296875, -3.34259033203125, -3.224365234375, -3.10614013671875, -2.9879150390625, -2.86968994140625, -2.75146484375, -2.63323974609375, -2.5150146484375, -2.39678955078125, -2.278564453125, -2.16033935546875, -2.0421142578125, -1.92388916015625, -1.8056640625, -1.68743896484375, -1.5692138671875, -1.45098876953125, -1.332763671875, -1.21453857421875, -1.0963134765625, -0.97808837890625, -0.85986328125, -0.74163818359375, -0.6234130859375, -0.50518798828125, -0.386962890625, -0.26873779296875, -0.1505126953125, -0.03228759765625, 0.0859375, 0.20416259765625, 0.3223876953125, 0.44061279296875, 0.558837890625, 0.67706298828125, 0.7952880859375, 0.91351318359375, 1.03173828125, 1.14996337890625, 1.2681884765625, 1.38641357421875, 1.504638671875, 1.62286376953125, 1.7410888671875, 1.85931396484375, 1.9775390625, 2.09576416015625, 2.2139892578125, 2.33221435546875, 2.450439453125, 2.56866455078125, 2.6868896484375, 2.80511474609375, 2.92333984375, 3.04156494140625, 3.1597900390625, 3.27801513671875, 3.396240234375, 3.51446533203125, 3.6326904296875, 3.75091552734375, 3.869140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 6.0, 8.0, 8.0, 6.0, 5.0, 13.0, 13.0, 12.0, 18.0, 28.0, 31.0, 26.0, 35.0, 35.0, 45.0, 54.0, 84.0, 79.0, 80.0, 74.0, 67.0, 54.0, 35.0, 42.0, 22.0, 18.0, 14.0, 12.0, 12.0, 11.0, 11.0, 17.0, 5.0, 5.0, 0.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.03125, -7.8194580078125, -7.607666015625, -7.3958740234375, -7.18408203125, -6.9722900390625, -6.760498046875, -6.5487060546875, -6.3369140625, -6.1251220703125, -5.913330078125, -5.7015380859375, -5.48974609375, -5.2779541015625, -5.066162109375, -4.8543701171875, -4.642578125, -4.4307861328125, -4.218994140625, -4.0072021484375, -3.79541015625, -3.5836181640625, -3.371826171875, -3.1600341796875, -2.9482421875, -2.7364501953125, -2.524658203125, -2.3128662109375, -2.10107421875, -1.8892822265625, -1.677490234375, -1.4656982421875, -1.25390625, -1.0421142578125, -0.830322265625, -0.6185302734375, -0.40673828125, -0.1949462890625, 0.016845703125, 0.2286376953125, 0.4404296875, 0.6522216796875, 0.864013671875, 1.0758056640625, 1.28759765625, 1.4993896484375, 1.711181640625, 1.9229736328125, 2.134765625, 2.3465576171875, 2.558349609375, 2.7701416015625, 2.98193359375, 3.1937255859375, 3.405517578125, 3.6173095703125, 3.8291015625, 4.0408935546875, 4.252685546875, 4.4644775390625, 4.67626953125, 4.8880615234375, 5.099853515625, 5.3116455078125, 5.5234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 7.0, 6.0, 13.0, 11.0, 13.0, 23.0, 20.0, 31.0, 42.0, 66.0, 92.0, 152.0, 340.0, 702.0, 1585.0, 4555.0, 18138.0, 149916.0, 828623.0, 32985.0, 7054.0, 2213.0, 930.0, 409.0, 227.0, 132.0, 67.0, 43.0, 24.0, 24.0, 28.0, 20.0, 13.0, 12.0, 6.0, 5.0, 3.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59375, -0.5740737915039062, -0.5543975830078125, -0.5347213745117188, -0.515045166015625, -0.49536895751953125, -0.4756927490234375, -0.45601654052734375, -0.43634033203125, -0.41666412353515625, -0.3969879150390625, -0.37731170654296875, -0.357635498046875, -0.33795928955078125, -0.3182830810546875, -0.29860687255859375, -0.2789306640625, -0.25925445556640625, -0.2395782470703125, -0.21990203857421875, -0.200225830078125, -0.18054962158203125, -0.1608734130859375, -0.14119720458984375, -0.12152099609375, -0.10184478759765625, -0.0821685791015625, -0.06249237060546875, -0.042816162109375, -0.02313995361328125, -0.0034637451171875, 0.01621246337890625, 0.035888671875, 0.05556488037109375, 0.0752410888671875, 0.09491729736328125, 0.114593505859375, 0.13426971435546875, 0.1539459228515625, 0.17362213134765625, 0.19329833984375, 0.21297454833984375, 0.2326507568359375, 0.25232696533203125, 0.272003173828125, 0.29167938232421875, 0.3113555908203125, 0.33103179931640625, 0.3507080078125, 0.37038421630859375, 0.3900604248046875, 0.40973663330078125, 0.429412841796875, 0.44908905029296875, 0.4687652587890625, 0.48844146728515625, 0.50811767578125, 0.5277938842773438, 0.5474700927734375, 0.5671463012695312, 0.586822509765625, 0.6064987182617188, 0.6261749267578125, 0.6458511352539062, 0.66552734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 9.0, 8.0, 11.0, 7.0, 14.0, 14.0, 24.0, 45.0, 43.0, 103.0, 130.0, 141.0, 144.0, 87.0, 50.0, 37.0, 19.0, 24.0, 21.0, 9.0, 5.0, 10.0, 9.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00017118453979492188, -0.00016557052731513977, -0.00015995651483535767, -0.00015434250235557556, -0.00014872848987579346, -0.00014311447739601135, -0.00013750046491622925, -0.00013188645243644714, -0.00012627243995666504, -0.00012065842747688293, -0.00011504441499710083, -0.00010943040251731873, -0.00010381639003753662, -9.820237755775452e-05, -9.258836507797241e-05, -8.697435259819031e-05, -8.13603401184082e-05, -7.57463276386261e-05, -7.0132315158844e-05, -6.451830267906189e-05, -5.8904290199279785e-05, -5.329027771949768e-05, -4.7676265239715576e-05, -4.206225275993347e-05, -3.644824028015137e-05, -3.083422780036926e-05, -2.5220215320587158e-05, -1.9606202840805054e-05, -1.399219036102295e-05, -8.378177881240845e-06, -2.7641654014587402e-06, 2.8498470783233643e-06, 8.463859558105469e-06, 1.4077872037887573e-05, 1.9691884517669678e-05, 2.5305896997451782e-05, 3.091990947723389e-05, 3.653392195701599e-05, 4.2147934436798096e-05, 4.77619469165802e-05, 5.3375959396362305e-05, 5.898997187614441e-05, 6.460398435592651e-05, 7.021799683570862e-05, 7.583200931549072e-05, 8.144602179527283e-05, 8.706003427505493e-05, 9.267404675483704e-05, 9.828805923461914e-05, 0.00010390207171440125, 0.00010951608419418335, 0.00011513009667396545, 0.00012074410915374756, 0.00012635812163352966, 0.00013197213411331177, 0.00013758614659309387, 0.00014320015907287598, 0.00014881417155265808, 0.00015442818403244019, 0.0001600421965122223, 0.0001656562089920044, 0.0001712702214717865, 0.0001768842339515686, 0.0001824982464313507, 0.0001881122589111328]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 8.0, 8.0, 20.0, 23.0, 37.0, 51.0, 77.0, 111.0, 208.0, 342.0, 613.0, 1231.0, 2872.0, 7350.0, 21821.0, 92823.0, 797953.0, 89120.0, 20988.0, 7227.0, 2885.0, 1279.0, 608.0, 330.0, 200.0, 115.0, 89.0, 55.0, 28.0, 18.0, 17.0, 14.0, 10.0, 2.0, 8.0, 5.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4002571105957031, -0.38620758056640625, -0.3721580505371094, -0.3581085205078125, -0.3440589904785156, -0.33000946044921875, -0.3159599304199219, -0.301910400390625, -0.2878608703613281, -0.27381134033203125, -0.2597618103027344, -0.2457122802734375, -0.23166275024414062, -0.21761322021484375, -0.20356369018554688, -0.18951416015625, -0.17546463012695312, -0.16141510009765625, -0.14736557006835938, -0.1333160400390625, -0.11926651000976562, -0.10521697998046875, -0.09116744995117188, -0.077117919921875, -0.06306838989257812, -0.04901885986328125, -0.034969329833984375, -0.0209197998046875, -0.006870269775390625, 0.00717926025390625, 0.021228790283203125, 0.0352783203125, 0.049327850341796875, 0.06337738037109375, 0.07742691040039062, 0.0914764404296875, 0.10552597045898438, 0.11957550048828125, 0.13362503051757812, 0.147674560546875, 0.16172409057617188, 0.17577362060546875, 0.18982315063476562, 0.2038726806640625, 0.21792221069335938, 0.23197174072265625, 0.24602127075195312, 0.26007080078125, 0.2741203308105469, 0.28816986083984375, 0.3022193908691406, 0.3162689208984375, 0.3303184509277344, 0.34436798095703125, 0.3584175109863281, 0.372467041015625, 0.3865165710449219, 0.40056610107421875, 0.4146156311035156, 0.4286651611328125, 0.4427146911621094, 0.45676422119140625, 0.4708137512207031, 0.48486328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 12.0, 9.0, 7.0, 17.0, 14.0, 20.0, 24.0, 47.0, 50.0, 85.0, 88.0, 108.0, 106.0, 97.0, 70.0, 56.0, 26.0, 35.0, 24.0, 19.0, 12.0, 17.0, 15.0, 8.0, 9.0, 9.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56982421875, -0.5520782470703125, -0.534332275390625, -0.5165863037109375, -0.49884033203125, -0.4810943603515625, -0.463348388671875, -0.4456024169921875, -0.4278564453125, -0.4101104736328125, -0.392364501953125, -0.3746185302734375, -0.35687255859375, -0.3391265869140625, -0.321380615234375, -0.3036346435546875, -0.285888671875, -0.2681427001953125, -0.250396728515625, -0.2326507568359375, -0.21490478515625, -0.1971588134765625, -0.179412841796875, -0.1616668701171875, -0.1439208984375, -0.1261749267578125, -0.108428955078125, -0.0906829833984375, -0.07293701171875, -0.0551910400390625, -0.037445068359375, -0.0196990966796875, -0.001953125, 0.0157928466796875, 0.033538818359375, 0.0512847900390625, 0.06903076171875, 0.0867767333984375, 0.104522705078125, 0.1222686767578125, 0.1400146484375, 0.1577606201171875, 0.175506591796875, 0.1932525634765625, 0.21099853515625, 0.2287445068359375, 0.246490478515625, 0.2642364501953125, 0.281982421875, 0.2997283935546875, 0.317474365234375, 0.3352203369140625, 0.35296630859375, 0.3707122802734375, 0.388458251953125, 0.4062042236328125, 0.4239501953125, 0.4416961669921875, 0.459442138671875, 0.4771881103515625, 0.49493408203125, 0.5126800537109375, 0.530426025390625, 0.5481719970703125, 0.56591796875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 29.0, 89.0, 517.0, 273.0, 68.0, 13.0, 9.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.38037872314453, -33.6751708984375, -31.969966888427734, -30.264760971069336, -28.559555053710938, -26.85434913635254, -25.14914321899414, -23.443937301635742, -21.738731384277344, -20.033525466918945, -18.328319549560547, -16.62311363220215, -14.91790771484375, -13.212701797485352, -11.507495880126953, -9.802289962768555, -8.097084045410156, -6.391878128051758, -4.686672210693359, -2.981466293334961, -1.2762603759765625, 0.42894554138183594, 2.1341514587402344, 3.839357376098633, 5.544563293457031, 7.24976921081543, 8.954975128173828, 10.660181045532227, 12.365386962890625, 14.070592880249023, 15.775798797607422, 17.48100471496582, 19.18621063232422, 20.891416549682617, 22.596622467041016, 24.301828384399414, 26.007034301757812, 27.71224021911621, 29.41744613647461, 31.122652053833008, 32.827857971191406, 34.53306579589844, 36.2382698059082, 37.94347381591797, 39.648681640625, 41.35388946533203, 43.0590934753418, 44.76429748535156, 46.469505310058594, 48.174713134765625, 49.87991714477539, 51.585121154785156, 53.29032897949219, 54.99553680419922, 56.700740814208984, 58.40594482421875, 60.11115264892578, 61.81636047363281, 63.52156448364258, 65.22676849365234, 66.93197631835938, 68.6371841430664, 70.34239196777344, 72.04759216308594, 73.75279998779297]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 9.0, 2.0, 5.0, 8.0, 4.0, 12.0, 11.0, 14.0, 19.0, 10.0, 21.0, 19.0, 20.0, 27.0, 101.0, 123.0, 53.0, 55.0, 63.0, 153.0, 91.0, 21.0, 22.0, 22.0, 14.0, 11.0, 10.0, 19.0, 12.0, 12.0, 10.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.678874969482422, -16.091264724731445, -15.503654479980469, -14.916044235229492, -14.328433990478516, -13.740823745727539, -13.153213500976562, -12.565603256225586, -11.97799301147461, -11.390382766723633, -10.802772521972656, -10.21516227722168, -9.627552032470703, -9.039941787719727, -8.45233154296875, -7.864721775054932, -7.277112007141113, -6.689501762390137, -6.10189151763916, -5.514281272888184, -4.926671028137207, -4.3390607833862305, -3.751451015472412, -3.1638407707214355, -2.576230525970459, -1.9886202812194824, -1.4010101556777954, -0.8134000301361084, -0.22578978538513184, 0.3618204593658447, 0.9494304656982422, 1.5370407104492188, 2.1246509552001953, 2.712261199951172, 3.2998714447021484, 3.887481451034546, 4.475091934204102, 5.062702178955078, 5.6503119468688965, 6.237922191619873, 6.82553243637085, 7.413142681121826, 8.000752449035645, 8.588362693786621, 9.175972938537598, 9.763583183288574, 10.35119342803955, 10.938803672790527, 11.526413917541504, 12.11402416229248, 12.701634407043457, 13.289244651794434, 13.87685489654541, 14.464465141296387, 15.052074432373047, 15.639684677124023, 16.227294921875, 16.814905166625977, 17.402515411376953, 17.99012565612793, 18.577735900878906, 19.165346145629883, 19.75295639038086, 20.340566635131836, 20.928176879882812]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 10.0, 8.0, 14.0, 22.0, 8.0, 21.0, 29.0, 26.0, 37.0, 42.0, 44.0, 91.0, 254.0, 92.0, 42.0, 35.0, 28.0, 26.0, 27.0, 19.0, 12.0, 8.0, 16.0, 15.0, 10.0, 9.0, 8.0, 5.0, 6.0, 2.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5419921875, -1.48944091796875, -1.4368896484375, -1.38433837890625, -1.331787109375, -1.27923583984375, -1.2266845703125, -1.17413330078125, -1.12158203125, -1.06903076171875, -1.0164794921875, -0.96392822265625, -0.911376953125, -0.85882568359375, -0.8062744140625, -0.75372314453125, -0.701171875, -0.64862060546875, -0.5960693359375, -0.54351806640625, -0.490966796875, -0.43841552734375, -0.3858642578125, -0.33331298828125, -0.28076171875, -0.22821044921875, -0.1756591796875, -0.12310791015625, -0.070556640625, -0.01800537109375, 0.0345458984375, 0.08709716796875, 0.1396484375, 0.19219970703125, 0.2447509765625, 0.29730224609375, 0.349853515625, 0.40240478515625, 0.4549560546875, 0.50750732421875, 0.56005859375, 0.61260986328125, 0.6651611328125, 0.71771240234375, 0.770263671875, 0.82281494140625, 0.8753662109375, 0.92791748046875, 0.98046875, 1.03302001953125, 1.0855712890625, 1.13812255859375, 1.190673828125, 1.24322509765625, 1.2957763671875, 1.34832763671875, 1.40087890625, 1.45343017578125, 1.5059814453125, 1.55853271484375, 1.611083984375, 1.66363525390625, 1.7161865234375, 1.76873779296875, 1.8212890625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 15.0, 6.0, 3.0, 14.0, 15.0, 49.0, 73.0, 121.0, 240.0, 799.0, 3983.0, 7760645.0, 617933.0, 3522.0, 697.0, 239.0, 108.0, 62.0, 19.0, 16.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.386871337890625, -29.542442321777344, -28.698013305664062, -27.85358428955078, -27.0091552734375, -26.16472625732422, -25.320297241210938, -24.475868225097656, -23.631439208984375, -22.787010192871094, -21.942581176757812, -21.09815216064453, -20.25372314453125, -19.40929412841797, -18.564865112304688, -17.720436096191406, -16.876007080078125, -16.031578063964844, -15.187149047851562, -14.342720031738281, -13.498291015625, -12.653861999511719, -11.809432983398438, -10.965003967285156, -10.120574951171875, -9.276145935058594, -8.431716918945312, -7.587287902832031, -6.74285888671875, -5.898429870605469, -5.0540008544921875, -4.209571838378906, -3.365142822265625, -2.5207138061523438, -1.6762847900390625, -0.8318557739257812, 0.0125732421875, 0.8570022583007812, 1.7014312744140625, 2.5458602905273438, 3.390289306640625, 4.234718322753906, 5.0791473388671875, 5.923576354980469, 6.76800537109375, 7.612434387207031, 8.456863403320312, 9.301292419433594, 10.145721435546875, 10.990150451660156, 11.834579467773438, 12.679008483886719, 13.5234375, 14.367866516113281, 15.212295532226562, 16.056724548339844, 16.901153564453125, 17.745582580566406, 18.590011596679688, 19.43444061279297, 20.27886962890625, 21.12329864501953, 21.967727661132812, 22.812156677246094, 23.656585693359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 9.0, 8.0, 0.0, 5.0, 3.0, 3.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.01439094543457, -28.215744018554688, -27.417095184326172, -26.61844825744629, -25.819801330566406, -25.02115249633789, -24.222505569458008, -23.423858642578125, -22.62520980834961, -21.826562881469727, -21.02791404724121, -20.229267120361328, -19.430620193481445, -18.63197135925293, -17.833324432373047, -17.03467559814453, -16.23603057861328, -15.437382698059082, -14.6387357711792, -13.840087890625, -13.0414400100708, -12.242792129516602, -11.444145202636719, -10.64549732208252, -9.84684944152832, -9.048201560974121, -8.249554634094238, -7.450906753540039, -6.65225887298584, -5.853611469268799, -5.054964065551758, -4.256316184997559, -3.4576683044433594, -2.6590206623077393, -1.8603731393814087, -1.0617256164550781, -0.263077974319458, 0.5355696678161621, 1.3342170715332031, 2.1328649520874023, 2.9315123558044434, 3.7301599979400635, 4.528807640075684, 5.327455043792725, 6.126102447509766, 6.924750328063965, 7.723397731781006, 8.522045135498047, 9.320693016052246, 10.119340896606445, 10.917987823486328, 11.716635704040527, 12.515283584594727, 13.31393051147461, 14.112578392028809, 14.911226272583008, 15.70987319946289, 16.508520126342773, 17.30716896057129, 18.105815887451172, 18.904462814331055, 19.70311164855957, 20.501758575439453, 21.30040740966797, 22.09905433654785]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 7.0, 6.0, 8.0, 20.0, 16.0, 21.0, 44.0, 66.0, 99.0, 154.0, 232.0, 375.0, 684.0, 1322.0, 2851.0, 6344.0, 14290.0, 34784.0, 85534.0, 167712.0, 121103.0, 50709.0, 20856.0, 8786.0, 4090.0, 1827.0, 968.0, 513.0, 323.0, 191.0, 112.0, 62.0, 42.0, 28.0, 15.0, 24.0, 20.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.59375, -12.2308349609375, -11.867919921875, -11.5050048828125, -11.14208984375, -10.7791748046875, -10.416259765625, -10.0533447265625, -9.6904296875, -9.3275146484375, -8.964599609375, -8.6016845703125, -8.23876953125, -7.8758544921875, -7.512939453125, -7.1500244140625, -6.787109375, -6.4241943359375, -6.061279296875, -5.6983642578125, -5.33544921875, -4.9725341796875, -4.609619140625, -4.2467041015625, -3.8837890625, -3.5208740234375, -3.157958984375, -2.7950439453125, -2.43212890625, -2.0692138671875, -1.706298828125, -1.3433837890625, -0.98046875, -0.6175537109375, -0.254638671875, 0.1082763671875, 0.47119140625, 0.8341064453125, 1.197021484375, 1.5599365234375, 1.9228515625, 2.2857666015625, 2.648681640625, 3.0115966796875, 3.37451171875, 3.7374267578125, 4.100341796875, 4.4632568359375, 4.826171875, 5.1890869140625, 5.552001953125, 5.9149169921875, 6.27783203125, 6.6407470703125, 7.003662109375, 7.3665771484375, 7.7294921875, 8.0924072265625, 8.455322265625, 8.8182373046875, 9.18115234375, 9.5440673828125, 9.906982421875, 10.2698974609375, 10.6328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 8.0, 6.0, 8.0, 5.0, 13.0, 5.0, 14.0, 18.0, 18.0, 14.0, 32.0, 23.0, 31.0, 34.0, 31.0, 45.0, 49.0, 62.0, 55.0, 67.0, 53.0, 62.0, 40.0, 51.0, 40.0, 37.0, 30.0, 31.0, 26.0, 13.0, 11.0, 17.0, 7.0, 9.0, 7.0, 7.0, 4.0, 10.0, 8.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4193267822265625, -1.365020751953125, -1.3107147216796875, -1.25640869140625, -1.2021026611328125, -1.147796630859375, -1.0934906005859375, -1.0391845703125, -0.9848785400390625, -0.930572509765625, -0.8762664794921875, -0.82196044921875, -0.7676544189453125, -0.713348388671875, -0.6590423583984375, -0.604736328125, -0.5504302978515625, -0.496124267578125, -0.4418182373046875, -0.38751220703125, -0.3332061767578125, -0.278900146484375, -0.2245941162109375, -0.1702880859375, -0.1159820556640625, -0.061676025390625, -0.0073699951171875, 0.04693603515625, 0.1012420654296875, 0.155548095703125, 0.2098541259765625, 0.26416015625, 0.3184661865234375, 0.372772216796875, 0.4270782470703125, 0.48138427734375, 0.5356903076171875, 0.589996337890625, 0.6443023681640625, 0.6986083984375, 0.7529144287109375, 0.807220458984375, 0.8615264892578125, 0.91583251953125, 0.9701385498046875, 1.024444580078125, 1.0787506103515625, 1.133056640625, 1.1873626708984375, 1.241668701171875, 1.2959747314453125, 1.35028076171875, 1.4045867919921875, 1.458892822265625, 1.5131988525390625, 1.5675048828125, 1.6218109130859375, 1.676116943359375, 1.7304229736328125, 1.78472900390625, 1.8390350341796875, 1.893341064453125, 1.9476470947265625, 2.001953125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 10.0, 22.0, 35.0, 55.0, 97.0, 71.0, 75.0, 34.0, 17.0, 11.0, 12.0, 4.0, 9.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.008161544799805, -15.497745513916016, -14.98732852935791, -14.476912498474121, -13.966495513916016, -13.456079483032227, -12.945663452148438, -12.435246467590332, -11.924829483032227, -11.414413452148438, -10.903996467590332, -10.393580436706543, -9.883163452148438, -9.372747421264648, -8.86233139038086, -8.351914405822754, -7.841498374938965, -7.331081867218018, -6.82066535949707, -6.310249328613281, -5.799832344055176, -5.289416313171387, -4.7789998054504395, -4.268583297729492, -3.758166790008545, -3.2477502822875977, -2.7373337745666504, -2.2269175052642822, -1.716500997543335, -1.2060844898223877, -0.6956682205200195, -0.18525171279907227, 0.325164794921875, 0.8355812430381775, 1.34599769115448, 1.8564140796661377, 2.366830587387085, 2.8772470951080322, 3.3876633644104004, 3.8980798721313477, 4.408496379852295, 4.918912887573242, 5.4293293952941895, 5.939745903015137, 6.450161933898926, 6.960578918457031, 7.47099494934082, 7.981411457061768, 8.491827964782715, 9.002243995666504, 9.51266098022461, 10.023077011108398, 10.533493995666504, 11.043910026550293, 11.554327011108398, 12.064743041992188, 12.575159072875977, 13.085575103759766, 13.595992088317871, 14.10640811920166, 14.616825103759766, 15.127241134643555, 15.637657165527344, 16.148075103759766, 16.658491134643555]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 6.0, 5.0, 5.0, 10.0, 12.0, 20.0, 38.0, 46.0, 58.0, 62.0, 59.0, 37.0, 31.0, 18.0, 12.0, 8.0, 7.0, 6.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.081541538238525, -6.814149379730225, -6.546757698059082, -6.279365539550781, -6.0119733810424805, -5.744581699371338, -5.477189540863037, -5.2097978591918945, -4.942405700683594, -4.675013542175293, -4.40762186050415, -4.14022970199585, -3.872837781906128, -3.6054458618164062, -3.3380537033081055, -3.070661783218384, -2.803269863128662, -2.5358779430389404, -2.2684860229492188, -2.001093864440918, -1.7337019443511963, -1.4663100242614746, -1.1989179849624634, -0.9315259456634521, -0.6641340255737305, -0.396742045879364, -0.12935006618499756, 0.1380419135093689, 0.40543389320373535, 0.672825813293457, 0.9402178525924683, 1.2076098918914795, 1.4750022888183594, 1.742394208908081, 2.0097861289978027, 2.2771782875061035, 2.544570207595825, 2.811962127685547, 3.0793542861938477, 3.3467462062835693, 3.614138126373291, 3.8815300464630127, 4.148921966552734, 4.416314125061035, 4.683706283569336, 4.9510979652404785, 5.218490123748779, 5.485881805419922, 5.753273963928223, 6.020666122436523, 6.288057804107666, 6.555449962615967, 6.822841644287109, 7.09023380279541, 7.357625961303711, 7.625018119812012, 7.892409801483154, 8.159801483154297, 8.427193641662598, 8.694585800170898, 8.9619779586792, 9.2293701171875, 9.496761322021484, 9.764153480529785, 10.031545639038086]}, "eval/loss": 1.8364678621292114, "eval/wer": 0.2812376041253471, "eval/runtime": 832.195, "eval/samples_per_second": 3.175, "eval/steps_per_second": 0.398} \ No newline at end of file +{"train/loss": 0.0162, "train/learning_rate": 8.907363420427554e-09, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 108038, "_timestamp": 1647482580, "_step": 17851, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 8.0, 12.0, 6.0, 8.0, 6.0, 12.0, 15.0, 17.0, 22.0, 35.0, 43.0, 41.0, 53.0, 54.0, 47.0, 56.0, 65.0, 50.0, 58.0, 50.0, 53.0, 44.0, 45.0, 43.0, 38.0, 23.0, 22.0, 17.0, 19.0, 12.0, 9.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.21875762939453, -88.52344512939453, -86.828125, -85.1328125, -83.43749237060547, -81.74217987060547, -80.04685974121094, -78.35154724121094, -76.65623474121094, -74.96092224121094, -73.2656021118164, -71.5702896118164, -69.87496948242188, -68.17965698242188, -66.48433685302734, -64.78902435302734, -63.09370422363281, -61.39838790893555, -59.70307159423828, -58.007755279541016, -56.31243896484375, -54.61712646484375, -52.921810150146484, -51.22649383544922, -49.53117752075195, -47.83586120605469, -46.14054489135742, -44.445228576660156, -42.749916076660156, -41.054595947265625, -39.359283447265625, -37.66396713256836, -35.96865463256836, -34.273338317871094, -32.57802200317383, -30.882707595825195, -29.18739128112793, -27.492074966430664, -25.79676055908203, -24.101444244384766, -22.4061279296875, -20.710811614990234, -19.01549530029297, -17.320180892944336, -15.62486457824707, -13.929548263549805, -12.234232902526855, -10.538917541503906, -8.84360122680664, -7.148285388946533, -5.452969551086426, -3.7576537132263184, -2.062337875366211, -0.3670215606689453, 1.328293800354004, 3.023609161376953, 4.718925476074219, 6.414241313934326, 8.109557151794434, 9.804872512817383, 11.500188827514648, 13.195505142211914, 14.890820503234863, 16.586135864257812, 18.281452178955078]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 6.0, 3.0, 2.0, 7.0, 7.0, 12.0, 14.0, 7.0, 15.0, 15.0, 26.0, 24.0, 24.0, 22.0, 35.0, 31.0, 23.0, 37.0, 38.0, 36.0, 32.0, 50.0, 48.0, 40.0, 41.0, 39.0, 35.0, 33.0, 49.0, 19.0, 29.0, 29.0, 18.0, 25.0, 19.0, 16.0, 24.0, 9.0, 14.0, 16.0, 9.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.85319900512695, -38.5408935546875, -37.22859191894531, -35.91628646850586, -34.60398483276367, -33.29167938232422, -31.9793758392334, -30.667072296142578, -29.354766845703125, -28.042463302612305, -26.730159759521484, -25.41785430908203, -24.10555076599121, -22.79324722290039, -21.48094367980957, -20.16864013671875, -18.85633659362793, -17.54403305053711, -16.23172950744629, -14.919425010681152, -13.607120513916016, -12.294816970825195, -10.982513427734375, -9.670208930969238, -8.357905387878418, -7.0456013679504395, -5.733297348022461, -4.420993804931641, -3.108689785003662, -1.7963857650756836, -0.4840822219848633, 0.8282222747802734, 2.1405258178710938, 3.4528298377990723, 4.765133857727051, 6.077437400817871, 7.38974142074585, 8.702045440673828, 10.014348983764648, 11.326653480529785, 12.638957023620605, 13.951260566711426, 15.263565063476562, 16.575868606567383, 17.888172149658203, 19.200477600097656, 20.512779235839844, 21.825084686279297, 23.137388229370117, 24.449691772460938, 25.761995315551758, 27.074298858642578, 28.38660430908203, 29.69890785217285, 31.011211395263672, 32.323516845703125, 33.63581848144531, 34.948123931884766, 36.26042556762695, 37.572731018066406, 38.885032653808594, 40.19733810424805, 41.5096435546875, 42.82194519042969, 44.13425064086914]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 10.0, 14.0, 25.0, 40.0, 47.0, 82.0, 141.0, 254.0, 401.0, 613.0, 991.0, 1579.0, 2531.0, 4057.0, 6334.0, 10190.0, 15867.0, 25238.0, 39251.0, 60422.0, 93260.0, 140151.0, 206561.0, 294505.0, 398751.0, 495048.0, 539183.0, 503644.0, 412134.0, 306321.0, 215690.0, 146820.0, 97775.0, 62907.0, 41042.0, 26517.0, 16954.0, 10778.0, 6679.0, 4275.0, 2650.0, 1652.0, 1122.0, 678.0, 415.0, 250.0, 173.0, 99.0, 64.0, 38.0, 33.0, 10.0, 9.0, 4.0, 6.0, 1.0, 2.0, 1.0], "bins": [-69.375, -67.244140625, -65.11328125, -62.982421875, -60.8515625, -58.720703125, -56.58984375, -54.458984375, -52.328125, -50.197265625, -48.06640625, -45.935546875, -43.8046875, -41.673828125, -39.54296875, -37.412109375, -35.28125, -33.150390625, -31.01953125, -28.888671875, -26.7578125, -24.626953125, -22.49609375, -20.365234375, -18.234375, -16.103515625, -13.97265625, -11.841796875, -9.7109375, -7.580078125, -5.44921875, -3.318359375, -1.1875, 0.943359375, 3.07421875, 5.205078125, 7.3359375, 9.466796875, 11.59765625, 13.728515625, 15.859375, 17.990234375, 20.12109375, 22.251953125, 24.3828125, 26.513671875, 28.64453125, 30.775390625, 32.90625, 35.037109375, 37.16796875, 39.298828125, 41.4296875, 43.560546875, 45.69140625, 47.822265625, 49.953125, 52.083984375, 54.21484375, 56.345703125, 58.4765625, 60.607421875, 62.73828125, 64.869140625, 67.0]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 8.0, 3.0, 8.0, 12.0, 9.0, 7.0, 7.0, 9.0, 20.0, 23.0, 17.0, 19.0, 19.0, 32.0, 23.0, 21.0, 29.0, 28.0, 30.0, 42.0, 37.0, 47.0, 35.0, 42.0, 34.0, 29.0, 32.0, 33.0, 40.0, 29.0, 17.0, 22.0, 24.0, 28.0, 23.0, 16.0, 8.0, 15.0, 16.0, 24.0, 10.0, 10.0, 10.0, 11.0, 8.0, 7.0, 4.0, 4.0, 5.0, 1.0, 4.0, 1.0, 6.0], "bins": [-44.59375, -43.29345703125, -41.9931640625, -40.69287109375, -39.392578125, -38.09228515625, -36.7919921875, -35.49169921875, -34.19140625, -32.89111328125, -31.5908203125, -30.29052734375, -28.990234375, -27.68994140625, -26.3896484375, -25.08935546875, -23.7890625, -22.48876953125, -21.1884765625, -19.88818359375, -18.587890625, -17.28759765625, -15.9873046875, -14.68701171875, -13.38671875, -12.08642578125, -10.7861328125, -9.48583984375, -8.185546875, -6.88525390625, -5.5849609375, -4.28466796875, -2.984375, -1.68408203125, -0.3837890625, 0.91650390625, 2.216796875, 3.51708984375, 4.8173828125, 6.11767578125, 7.41796875, 8.71826171875, 10.0185546875, 11.31884765625, 12.619140625, 13.91943359375, 15.2197265625, 16.52001953125, 17.8203125, 19.12060546875, 20.4208984375, 21.72119140625, 23.021484375, 24.32177734375, 25.6220703125, 26.92236328125, 28.22265625, 29.52294921875, 30.8232421875, 32.12353515625, 33.423828125, 34.72412109375, 36.0244140625, 37.32470703125, 38.625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 2.0, 11.0, 12.0, 27.0, 26.0, 44.0, 74.0, 134.0, 188.0, 283.0, 516.0, 890.0, 1421.0, 2352.0, 3865.0, 6632.0, 11175.0, 18153.0, 29958.0, 48549.0, 76983.0, 119442.0, 180406.0, 259012.0, 353465.0, 443011.0, 505307.0, 508941.0, 454892.0, 365317.0, 272535.0, 189286.0, 126771.0, 81705.0, 51802.0, 31955.0, 19354.0, 11873.0, 7158.0, 4307.0, 2539.0, 1601.0, 909.0, 554.0, 342.0, 180.0, 125.0, 80.0, 47.0, 28.0, 18.0, 12.0, 11.0, 3.0, 3.0, 3.0], "bins": [-63.9375, -62.1142578125, -60.291015625, -58.4677734375, -56.64453125, -54.8212890625, -52.998046875, -51.1748046875, -49.3515625, -47.5283203125, -45.705078125, -43.8818359375, -42.05859375, -40.2353515625, -38.412109375, -36.5888671875, -34.765625, -32.9423828125, -31.119140625, -29.2958984375, -27.47265625, -25.6494140625, -23.826171875, -22.0029296875, -20.1796875, -18.3564453125, -16.533203125, -14.7099609375, -12.88671875, -11.0634765625, -9.240234375, -7.4169921875, -5.59375, -3.7705078125, -1.947265625, -0.1240234375, 1.69921875, 3.5224609375, 5.345703125, 7.1689453125, 8.9921875, 10.8154296875, 12.638671875, 14.4619140625, 16.28515625, 18.1083984375, 19.931640625, 21.7548828125, 23.578125, 25.4013671875, 27.224609375, 29.0478515625, 30.87109375, 32.6943359375, 34.517578125, 36.3408203125, 38.1640625, 39.9873046875, 41.810546875, 43.6337890625, 45.45703125, 47.2802734375, 49.103515625, 50.9267578125, 52.75]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 8.0, 4.0, 6.0, 13.0, 10.0, 21.0, 16.0, 24.0, 26.0, 31.0, 30.0, 48.0, 58.0, 77.0, 75.0, 86.0, 118.0, 124.0, 114.0, 150.0, 153.0, 144.0, 208.0, 194.0, 204.0, 208.0, 216.0, 222.0, 181.0, 174.0, 173.0, 137.0, 132.0, 109.0, 109.0, 89.0, 70.0, 64.0, 50.0, 41.0, 39.0, 36.0, 20.0, 16.0, 10.0, 15.0, 5.0, 6.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.765625, -21.989013671875, -21.21240234375, -20.435791015625, -19.6591796875, -18.882568359375, -18.10595703125, -17.329345703125, -16.552734375, -15.776123046875, -14.99951171875, -14.222900390625, -13.4462890625, -12.669677734375, -11.89306640625, -11.116455078125, -10.33984375, -9.563232421875, -8.78662109375, -8.010009765625, -7.2333984375, -6.456787109375, -5.68017578125, -4.903564453125, -4.126953125, -3.350341796875, -2.57373046875, -1.797119140625, -1.0205078125, -0.243896484375, 0.53271484375, 1.309326171875, 2.0859375, 2.862548828125, 3.63916015625, 4.415771484375, 5.1923828125, 5.968994140625, 6.74560546875, 7.522216796875, 8.298828125, 9.075439453125, 9.85205078125, 10.628662109375, 11.4052734375, 12.181884765625, 12.95849609375, 13.735107421875, 14.51171875, 15.288330078125, 16.06494140625, 16.841552734375, 17.6181640625, 18.394775390625, 19.17138671875, 19.947998046875, 20.724609375, 21.501220703125, 22.27783203125, 23.054443359375, 23.8310546875, 24.607666015625, 25.38427734375, 26.160888671875, 26.9375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 9.0, 13.0, 25.0, 20.0, 19.0, 29.0, 29.0, 32.0, 37.0, 40.0, 34.0, 62.0, 40.0, 40.0, 39.0, 40.0, 51.0, 46.0, 42.0, 44.0, 35.0, 44.0, 26.0, 29.0, 25.0, 25.0, 21.0, 17.0, 14.0, 16.0, 10.0, 12.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-78.66213989257812, -76.70450592041016, -74.74687957763672, -72.78924560546875, -70.83161163330078, -68.87398529052734, -66.91635131835938, -64.9587173461914, -63.00109100341797, -61.043460845947266, -59.0858268737793, -57.128196716308594, -55.17056655883789, -53.21293640136719, -51.25530242919922, -49.297672271728516, -47.34003829956055, -45.382408142089844, -43.424774169921875, -41.46714401245117, -39.50951385498047, -37.5518798828125, -35.5942497253418, -33.636619567871094, -31.678987503051758, -29.721355438232422, -27.76372528076172, -25.806093215942383, -23.848461151123047, -21.890830993652344, -19.933198928833008, -17.975566864013672, -16.01793670654297, -14.06030559539795, -12.10267448425293, -10.145042419433594, -8.187411308288574, -6.229780197143555, -4.272148132324219, -2.314517021179199, -0.3568859100341797, 1.600745439529419, 3.5583767890930176, 5.516008377075195, 7.473639488220215, 9.431270599365234, 11.38890266418457, 13.34653377532959, 15.30416488647461, 17.261796951293945, 19.21942710876465, 21.177059173583984, 23.134689331054688, 25.092321395874023, 27.04995346069336, 29.007583618164062, 30.9652156829834, 32.922847747802734, 34.88047790527344, 36.838111877441406, 38.79574203491211, 40.75337219238281, 42.71100616455078, 44.668636322021484, 46.62626647949219]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 15.0, 9.0, 19.0, 19.0, 17.0, 25.0, 30.0, 20.0, 25.0, 38.0, 39.0, 30.0, 35.0, 28.0, 41.0, 38.0, 50.0, 41.0, 42.0, 46.0, 35.0, 28.0, 31.0, 26.0, 42.0, 27.0, 34.0, 23.0, 19.0, 18.0, 13.0, 10.0, 10.0, 7.0, 12.0, 9.0, 8.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.91980743408203, -60.128684997558594, -58.33755874633789, -56.54643630981445, -54.75531005859375, -52.96418762207031, -51.173065185546875, -49.38194274902344, -47.590816497802734, -45.7996940612793, -44.008567810058594, -42.217445373535156, -40.42632293701172, -38.635196685791016, -36.84407424926758, -35.052947998046875, -33.26182556152344, -31.470701217651367, -29.679576873779297, -27.88845443725586, -26.09733009338379, -24.30620574951172, -22.51508331298828, -20.72395896911621, -18.93283462524414, -17.14171028137207, -15.350586891174316, -13.559463500976562, -11.768339157104492, -9.977214813232422, -8.186091423034668, -6.394968032836914, -4.603847503662109, -2.8127236366271973, -1.0215997695922852, 0.769524097442627, 2.560647964477539, 4.351772308349609, 6.142895698547363, 7.934019088745117, 9.725143432617188, 11.516267776489258, 13.307391166687012, 15.098514556884766, 16.889638900756836, 18.680763244628906, 20.471885681152344, 22.263010025024414, 24.054134368896484, 25.845258712768555, 27.636383056640625, 29.427505493164062, 31.218629837036133, 33.0097541809082, 34.80087661743164, 36.592002868652344, 38.38312530517578, 40.17424774169922, 41.96537399291992, 43.75649642944336, 45.54762268066406, 47.3387451171875, 49.12986755371094, 50.920989990234375, 52.71211624145508]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 9.0, 12.0, 13.0, 28.0, 43.0, 55.0, 60.0, 123.0, 208.0, 287.0, 476.0, 743.0, 1171.0, 1851.0, 3053.0, 4997.0, 8039.0, 13451.0, 22545.0, 37176.0, 60395.0, 93730.0, 133593.0, 161822.0, 156923.0, 124441.0, 85225.0, 54203.0, 32889.0, 20007.0, 11904.0, 7386.0, 4376.0, 2726.0, 1632.0, 1085.0, 678.0, 388.0, 297.0, 198.0, 110.0, 84.0, 41.0, 29.0, 19.0, 16.0, 6.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-27.84375, -26.970458984375, -26.09716796875, -25.223876953125, -24.3505859375, -23.477294921875, -22.60400390625, -21.730712890625, -20.857421875, -19.984130859375, -19.11083984375, -18.237548828125, -17.3642578125, -16.490966796875, -15.61767578125, -14.744384765625, -13.87109375, -12.997802734375, -12.12451171875, -11.251220703125, -10.3779296875, -9.504638671875, -8.63134765625, -7.758056640625, -6.884765625, -6.011474609375, -5.13818359375, -4.264892578125, -3.3916015625, -2.518310546875, -1.64501953125, -0.771728515625, 0.1015625, 0.974853515625, 1.84814453125, 2.721435546875, 3.5947265625, 4.468017578125, 5.34130859375, 6.214599609375, 7.087890625, 7.961181640625, 8.83447265625, 9.707763671875, 10.5810546875, 11.454345703125, 12.32763671875, 13.200927734375, 14.07421875, 14.947509765625, 15.82080078125, 16.694091796875, 17.5673828125, 18.440673828125, 19.31396484375, 20.187255859375, 21.060546875, 21.933837890625, 22.80712890625, 23.680419921875, 24.5537109375, 25.427001953125, 26.30029296875, 27.173583984375, 28.046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 7.0, 9.0, 8.0, 13.0, 16.0, 16.0, 17.0, 18.0, 24.0, 34.0, 16.0, 21.0, 36.0, 40.0, 31.0, 25.0, 36.0, 38.0, 41.0, 40.0, 41.0, 43.0, 41.0, 38.0, 33.0, 30.0, 24.0, 37.0, 34.0, 29.0, 27.0, 22.0, 16.0, 17.0, 15.0, 9.0, 7.0, 9.0, 8.0, 11.0, 8.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-63.125, -61.3271484375, -59.529296875, -57.7314453125, -55.93359375, -54.1357421875, -52.337890625, -50.5400390625, -48.7421875, -46.9443359375, -45.146484375, -43.3486328125, -41.55078125, -39.7529296875, -37.955078125, -36.1572265625, -34.359375, -32.5615234375, -30.763671875, -28.9658203125, -27.16796875, -25.3701171875, -23.572265625, -21.7744140625, -19.9765625, -18.1787109375, -16.380859375, -14.5830078125, -12.78515625, -10.9873046875, -9.189453125, -7.3916015625, -5.59375, -3.7958984375, -1.998046875, -0.2001953125, 1.59765625, 3.3955078125, 5.193359375, 6.9912109375, 8.7890625, 10.5869140625, 12.384765625, 14.1826171875, 15.98046875, 17.7783203125, 19.576171875, 21.3740234375, 23.171875, 24.9697265625, 26.767578125, 28.5654296875, 30.36328125, 32.1611328125, 33.958984375, 35.7568359375, 37.5546875, 39.3525390625, 41.150390625, 42.9482421875, 44.74609375, 46.5439453125, 48.341796875, 50.1396484375, 51.9375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 9.0, 10.0, 19.0, 30.0, 36.0, 43.0, 67.0, 76.0, 119.0, 172.0, 235.0, 322.0, 479.0, 715.0, 1129.0, 1667.0, 2723.0, 4209.0, 7163.0, 12027.0, 22436.0, 56611.0, 843408.0, 44976.0, 20407.0, 11344.0, 6641.0, 4013.0, 2580.0, 1604.0, 1038.0, 692.0, 449.0, 321.0, 250.0, 138.0, 88.0, 87.0, 58.0, 37.0, 32.0, 31.0, 16.0, 11.0, 10.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-58.9375, -57.1201171875, -55.302734375, -53.4853515625, -51.66796875, -49.8505859375, -48.033203125, -46.2158203125, -44.3984375, -42.5810546875, -40.763671875, -38.9462890625, -37.12890625, -35.3115234375, -33.494140625, -31.6767578125, -29.859375, -28.0419921875, -26.224609375, -24.4072265625, -22.58984375, -20.7724609375, -18.955078125, -17.1376953125, -15.3203125, -13.5029296875, -11.685546875, -9.8681640625, -8.05078125, -6.2333984375, -4.416015625, -2.5986328125, -0.78125, 1.0361328125, 2.853515625, 4.6708984375, 6.48828125, 8.3056640625, 10.123046875, 11.9404296875, 13.7578125, 15.5751953125, 17.392578125, 19.2099609375, 21.02734375, 22.8447265625, 24.662109375, 26.4794921875, 28.296875, 30.1142578125, 31.931640625, 33.7490234375, 35.56640625, 37.3837890625, 39.201171875, 41.0185546875, 42.8359375, 44.6533203125, 46.470703125, 48.2880859375, 50.10546875, 51.9228515625, 53.740234375, 55.5576171875, 57.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 9.0, 8.0, 6.0, 15.0, 10.0, 16.0, 14.0, 22.0, 14.0, 21.0, 20.0, 23.0, 38.0, 34.0, 42.0, 29.0, 44.0, 37.0, 40.0, 54.0, 45.0, 39.0, 27.0, 46.0, 40.0, 33.0, 40.0, 28.0, 40.0, 28.0, 28.0, 17.0, 13.0, 22.0, 14.0, 8.0, 8.0, 8.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.65625, -39.41064453125, -38.1650390625, -36.91943359375, -35.673828125, -34.42822265625, -33.1826171875, -31.93701171875, -30.69140625, -29.44580078125, -28.2001953125, -26.95458984375, -25.708984375, -24.46337890625, -23.2177734375, -21.97216796875, -20.7265625, -19.48095703125, -18.2353515625, -16.98974609375, -15.744140625, -14.49853515625, -13.2529296875, -12.00732421875, -10.76171875, -9.51611328125, -8.2705078125, -7.02490234375, -5.779296875, -4.53369140625, -3.2880859375, -2.04248046875, -0.796875, 0.44873046875, 1.6943359375, 2.93994140625, 4.185546875, 5.43115234375, 6.6767578125, 7.92236328125, 9.16796875, 10.41357421875, 11.6591796875, 12.90478515625, 14.150390625, 15.39599609375, 16.6416015625, 17.88720703125, 19.1328125, 20.37841796875, 21.6240234375, 22.86962890625, 24.115234375, 25.36083984375, 26.6064453125, 27.85205078125, 29.09765625, 30.34326171875, 31.5888671875, 32.83447265625, 34.080078125, 35.32568359375, 36.5712890625, 37.81689453125, 39.0625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 7.0, 5.0, 13.0, 11.0, 19.0, 49.0, 39.0, 72.0, 85.0, 142.0, 213.0, 415.0, 938.0, 2470.0, 10350.0, 92506.0, 916821.0, 18308.0, 3572.0, 1174.0, 541.0, 275.0, 138.0, 118.0, 61.0, 46.0, 39.0, 20.0, 18.0, 23.0, 11.0, 11.0, 6.0, 4.0, 1.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.0859375, -11.721435546875, -11.35693359375, -10.992431640625, -10.6279296875, -10.263427734375, -9.89892578125, -9.534423828125, -9.169921875, -8.805419921875, -8.44091796875, -8.076416015625, -7.7119140625, -7.347412109375, -6.98291015625, -6.618408203125, -6.25390625, -5.889404296875, -5.52490234375, -5.160400390625, -4.7958984375, -4.431396484375, -4.06689453125, -3.702392578125, -3.337890625, -2.973388671875, -2.60888671875, -2.244384765625, -1.8798828125, -1.515380859375, -1.15087890625, -0.786376953125, -0.421875, -0.057373046875, 0.30712890625, 0.671630859375, 1.0361328125, 1.400634765625, 1.76513671875, 2.129638671875, 2.494140625, 2.858642578125, 3.22314453125, 3.587646484375, 3.9521484375, 4.316650390625, 4.68115234375, 5.045654296875, 5.41015625, 5.774658203125, 6.13916015625, 6.503662109375, 6.8681640625, 7.232666015625, 7.59716796875, 7.961669921875, 8.326171875, 8.690673828125, 9.05517578125, 9.419677734375, 9.7841796875, 10.148681640625, 10.51318359375, 10.877685546875, 11.2421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 23.0, 30.0, 33.0, 54.0, 77.0, 108.0, 137.0, 147.0, 102.0, 86.0, 60.0, 36.0, 18.0, 17.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005898475646972656, -0.0005728527903556824, -0.0005558580160140991, -0.0005388632416725159, -0.0005218684673309326, -0.0005048736929893494, -0.0004878789186477661, -0.00047088414430618286, -0.0004538893699645996, -0.00043689459562301636, -0.0004198998212814331, -0.00040290504693984985, -0.0003859102725982666, -0.00036891549825668335, -0.0003519207239151001, -0.00033492594957351685, -0.0003179311752319336, -0.00030093640089035034, -0.0002839416265487671, -0.00026694685220718384, -0.0002499520778656006, -0.00023295730352401733, -0.00021596252918243408, -0.00019896775484085083, -0.00018197298049926758, -0.00016497820615768433, -0.00014798343181610107, -0.00013098865747451782, -0.00011399388313293457, -9.699910879135132e-05, -8.000433444976807e-05, -6.300956010818481e-05, -4.601478576660156e-05, -2.902001142501831e-05, -1.2025237083435059e-05, 4.969537258148193e-06, 2.1964311599731445e-05, 3.89590859413147e-05, 5.595386028289795e-05, 7.29486346244812e-05, 8.994340896606445e-05, 0.0001069381833076477, 0.00012393295764923096, 0.0001409277319908142, 0.00015792250633239746, 0.0001749172806739807, 0.00019191205501556396, 0.00020890682935714722, 0.00022590160369873047, 0.00024289637804031372, 0.00025989115238189697, 0.0002768859267234802, 0.0002938807010650635, 0.00031087547540664673, 0.00032787024974823, 0.00034486502408981323, 0.0003618597984313965, 0.00037885457277297974, 0.000395849347114563, 0.00041284412145614624, 0.0004298388957977295, 0.00044683367013931274, 0.000463828444480896, 0.00048082321882247925, 0.0004978179931640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 12.0, 18.0, 26.0, 27.0, 44.0, 60.0, 74.0, 151.0, 212.0, 399.0, 745.0, 1475.0, 3388.0, 8242.0, 20828.0, 54635.0, 139127.0, 277642.0, 290147.0, 151537.0, 60375.0, 22905.0, 9126.0, 3815.0, 1639.0, 815.0, 402.0, 230.0, 156.0, 92.0, 59.0, 43.0, 22.0, 17.0, 21.0, 11.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -8.02288818359375, -7.7801513671875, -7.53741455078125, -7.294677734375, -7.05194091796875, -6.8092041015625, -6.56646728515625, -6.32373046875, -6.08099365234375, -5.8382568359375, -5.59552001953125, -5.352783203125, -5.11004638671875, -4.8673095703125, -4.62457275390625, -4.3818359375, -4.13909912109375, -3.8963623046875, -3.65362548828125, -3.410888671875, -3.16815185546875, -2.9254150390625, -2.68267822265625, -2.43994140625, -2.19720458984375, -1.9544677734375, -1.71173095703125, -1.468994140625, -1.22625732421875, -0.9835205078125, -0.74078369140625, -0.498046875, -0.25531005859375, -0.0125732421875, 0.23016357421875, 0.472900390625, 0.71563720703125, 0.9583740234375, 1.20111083984375, 1.44384765625, 1.68658447265625, 1.9293212890625, 2.17205810546875, 2.414794921875, 2.65753173828125, 2.9002685546875, 3.14300537109375, 3.3857421875, 3.62847900390625, 3.8712158203125, 4.11395263671875, 4.356689453125, 4.59942626953125, 4.8421630859375, 5.08489990234375, 5.32763671875, 5.57037353515625, 5.8131103515625, 6.05584716796875, 6.298583984375, 6.54132080078125, 6.7840576171875, 7.02679443359375, 7.26953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 7.0, 8.0, 8.0, 15.0, 13.0, 17.0, 19.0, 17.0, 25.0, 38.0, 31.0, 42.0, 46.0, 71.0, 58.0, 50.0, 58.0, 52.0, 47.0, 55.0, 43.0, 30.0, 33.0, 31.0, 27.0, 27.0, 15.0, 13.0, 18.0, 16.0, 14.0, 10.0, 6.0, 6.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4169921875, -1.37042236328125, -1.3238525390625, -1.27728271484375, -1.230712890625, -1.18414306640625, -1.1375732421875, -1.09100341796875, -1.04443359375, -0.99786376953125, -0.9512939453125, -0.90472412109375, -0.858154296875, -0.81158447265625, -0.7650146484375, -0.71844482421875, -0.671875, -0.62530517578125, -0.5787353515625, -0.53216552734375, -0.485595703125, -0.43902587890625, -0.3924560546875, -0.34588623046875, -0.29931640625, -0.25274658203125, -0.2061767578125, -0.15960693359375, -0.113037109375, -0.06646728515625, -0.0198974609375, 0.02667236328125, 0.0732421875, 0.11981201171875, 0.1663818359375, 0.21295166015625, 0.259521484375, 0.30609130859375, 0.3526611328125, 0.39923095703125, 0.44580078125, 0.49237060546875, 0.5389404296875, 0.58551025390625, 0.632080078125, 0.67864990234375, 0.7252197265625, 0.77178955078125, 0.818359375, 0.86492919921875, 0.9114990234375, 0.95806884765625, 1.004638671875, 1.05120849609375, 1.0977783203125, 1.14434814453125, 1.19091796875, 1.23748779296875, 1.2840576171875, 1.33062744140625, 1.377197265625, 1.42376708984375, 1.4703369140625, 1.51690673828125, 1.5634765625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 5.0, 6.0, 14.0, 18.0, 22.0, 26.0, 22.0, 29.0, 34.0, 46.0, 41.0, 53.0, 47.0, 45.0, 44.0, 46.0, 47.0, 47.0, 51.0, 54.0, 42.0, 46.0, 25.0, 28.0, 29.0, 18.0, 20.0, 20.0, 15.0, 9.0, 12.0, 10.0, 5.0, 7.0, 4.0, 2.0, 4.0], "bins": [-92.06939697265625, -89.90866088867188, -87.7479248046875, -85.5871810913086, -83.42644500732422, -81.26570892333984, -79.10497283935547, -76.9442367553711, -74.78349304199219, -72.62275695800781, -70.46202087402344, -68.30127716064453, -66.14054107666016, -63.97980499267578, -61.819068908691406, -59.65833282470703, -57.497596740722656, -55.33686065673828, -53.17612075805664, -51.015384674072266, -48.854644775390625, -46.69390869140625, -44.533172607421875, -42.3724365234375, -40.21169662475586, -38.050960540771484, -35.890220642089844, -33.72948455810547, -31.56874656677246, -29.408008575439453, -27.247272491455078, -25.08653450012207, -22.925800323486328, -20.76506233215332, -18.604324340820312, -16.443588256835938, -14.28285026550293, -12.122112274169922, -9.96137523651123, -7.800638198852539, -5.639900207519531, -3.4791626930236816, -1.318425178527832, 0.8423123359680176, 3.003049850463867, 5.163787841796875, 7.324524879455566, 9.485261917114258, 11.645999908447266, 13.806737899780273, 15.967474937438965, 18.128211975097656, 20.288949966430664, 22.449687957763672, 24.610424041748047, 26.771162033081055, 28.931900024414062, 31.09263801574707, 33.25337600708008, 35.41411209106445, 37.574851989746094, 39.73558807373047, 41.896324157714844, 44.05706024169922, 46.21780014038086]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 12.0, 8.0, 18.0, 7.0, 12.0, 22.0, 16.0, 24.0, 35.0, 20.0, 23.0, 29.0, 36.0, 37.0, 25.0, 31.0, 38.0, 38.0, 39.0, 46.0, 34.0, 45.0, 39.0, 37.0, 28.0, 22.0, 33.0, 40.0, 29.0, 27.0, 22.0, 19.0, 15.0, 14.0, 14.0, 9.0, 3.0, 12.0, 8.0, 11.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-62.82893371582031, -61.046478271484375, -59.2640266418457, -57.481571197509766, -55.69911575317383, -53.916664123535156, -52.13420867919922, -50.35175323486328, -48.569297790527344, -46.786842346191406, -45.004390716552734, -43.2219352722168, -41.43947982788086, -39.65702819824219, -37.87457275390625, -36.09211730957031, -34.30966567993164, -32.5272102355957, -30.7447566986084, -28.962303161621094, -27.179847717285156, -25.39739418029785, -23.614940643310547, -21.83248519897461, -20.050031661987305, -18.267578125, -16.485122680664062, -14.702669143676758, -12.920214653015137, -11.137760162353516, -9.355306625366211, -7.57285213470459, -5.790393829345703, -4.007939338684082, -2.225485324859619, -0.44303131103515625, 1.3394231796264648, 3.121877670288086, 4.904331207275391, 6.686785697937012, 8.469240188598633, 10.251694679260254, 12.034149169921875, 13.81660270690918, 15.5990571975708, 17.381511688232422, 19.163965225219727, 20.94641876220703, 22.72887420654297, 24.511327743530273, 26.29378318786621, 28.076236724853516, 29.858692169189453, 31.641145706176758, 33.42359924316406, 35.2060546875, 36.98851013183594, 38.770965576171875, 40.55341720581055, 42.335872650146484, 44.11832809448242, 45.900779724121094, 47.68323516845703, 49.46569061279297, 51.24814224243164]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 13.0, 22.0, 31.0, 34.0, 80.0, 111.0, 177.0, 265.0, 400.0, 644.0, 1055.0, 1798.0, 2974.0, 5285.0, 9544.0, 16776.0, 29014.0, 48286.0, 75929.0, 107305.0, 135026.0, 147042.0, 139357.0, 114342.0, 82199.0, 53526.0, 32988.0, 19083.0, 10638.0, 6040.0, 3380.0, 2016.0, 1126.0, 741.0, 468.0, 260.0, 184.0, 118.0, 97.0, 62.0, 49.0, 22.0, 13.0, 9.0, 7.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.9375, -68.693359375, -66.44921875, -64.205078125, -61.9609375, -59.716796875, -57.47265625, -55.228515625, -52.984375, -50.740234375, -48.49609375, -46.251953125, -44.0078125, -41.763671875, -39.51953125, -37.275390625, -35.03125, -32.787109375, -30.54296875, -28.298828125, -26.0546875, -23.810546875, -21.56640625, -19.322265625, -17.078125, -14.833984375, -12.58984375, -10.345703125, -8.1015625, -5.857421875, -3.61328125, -1.369140625, 0.875, 3.119140625, 5.36328125, 7.607421875, 9.8515625, 12.095703125, 14.33984375, 16.583984375, 18.828125, 21.072265625, 23.31640625, 25.560546875, 27.8046875, 30.048828125, 32.29296875, 34.537109375, 36.78125, 39.025390625, 41.26953125, 43.513671875, 45.7578125, 48.001953125, 50.24609375, 52.490234375, 54.734375, 56.978515625, 59.22265625, 61.466796875, 63.7109375, 65.955078125, 68.19921875, 70.443359375, 72.6875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 6.0, 11.0, 10.0, 13.0, 12.0, 13.0, 20.0, 20.0, 22.0, 34.0, 22.0, 20.0, 33.0, 39.0, 34.0, 25.0, 36.0, 39.0, 43.0, 37.0, 44.0, 35.0, 47.0, 43.0, 26.0, 31.0, 29.0, 37.0, 36.0, 29.0, 25.0, 18.0, 14.0, 17.0, 15.0, 12.0, 4.0, 10.0, 9.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-63.15625, -61.34814453125, -59.5400390625, -57.73193359375, -55.923828125, -54.11572265625, -52.3076171875, -50.49951171875, -48.69140625, -46.88330078125, -45.0751953125, -43.26708984375, -41.458984375, -39.65087890625, -37.8427734375, -36.03466796875, -34.2265625, -32.41845703125, -30.6103515625, -28.80224609375, -26.994140625, -25.18603515625, -23.3779296875, -21.56982421875, -19.76171875, -17.95361328125, -16.1455078125, -14.33740234375, -12.529296875, -10.72119140625, -8.9130859375, -7.10498046875, -5.296875, -3.48876953125, -1.6806640625, 0.12744140625, 1.935546875, 3.74365234375, 5.5517578125, 7.35986328125, 9.16796875, 10.97607421875, 12.7841796875, 14.59228515625, 16.400390625, 18.20849609375, 20.0166015625, 21.82470703125, 23.6328125, 25.44091796875, 27.2490234375, 29.05712890625, 30.865234375, 32.67333984375, 34.4814453125, 36.28955078125, 38.09765625, 39.90576171875, 41.7138671875, 43.52197265625, 45.330078125, 47.13818359375, 48.9462890625, 50.75439453125, 52.5625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 5.0, 5.0, 24.0, 25.0, 48.0, 56.0, 94.0, 140.0, 191.0, 276.0, 448.0, 636.0, 996.0, 1483.0, 2353.0, 3777.0, 6082.0, 10086.0, 17115.0, 28073.0, 45244.0, 69942.0, 98908.0, 126951.0, 142416.0, 138377.0, 115862.0, 85563.0, 58079.0, 37091.0, 22561.0, 13524.0, 8290.0, 5013.0, 3177.0, 1963.0, 1259.0, 763.0, 566.0, 363.0, 240.0, 158.0, 115.0, 68.0, 58.0, 28.0, 18.0, 12.0, 8.0, 6.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0], "bins": [-79.75, -77.3173828125, -74.884765625, -72.4521484375, -70.01953125, -67.5869140625, -65.154296875, -62.7216796875, -60.2890625, -57.8564453125, -55.423828125, -52.9912109375, -50.55859375, -48.1259765625, -45.693359375, -43.2607421875, -40.828125, -38.3955078125, -35.962890625, -33.5302734375, -31.09765625, -28.6650390625, -26.232421875, -23.7998046875, -21.3671875, -18.9345703125, -16.501953125, -14.0693359375, -11.63671875, -9.2041015625, -6.771484375, -4.3388671875, -1.90625, 0.5263671875, 2.958984375, 5.3916015625, 7.82421875, 10.2568359375, 12.689453125, 15.1220703125, 17.5546875, 19.9873046875, 22.419921875, 24.8525390625, 27.28515625, 29.7177734375, 32.150390625, 34.5830078125, 37.015625, 39.4482421875, 41.880859375, 44.3134765625, 46.74609375, 49.1787109375, 51.611328125, 54.0439453125, 56.4765625, 58.9091796875, 61.341796875, 63.7744140625, 66.20703125, 68.6396484375, 71.072265625, 73.5048828125, 75.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 10.0, 7.0, 14.0, 9.0, 17.0, 14.0, 14.0, 27.0, 32.0, 30.0, 33.0, 37.0, 34.0, 48.0, 46.0, 35.0, 39.0, 51.0, 42.0, 35.0, 46.0, 42.0, 33.0, 33.0, 36.0, 33.0, 21.0, 25.0, 16.0, 21.0, 20.0, 23.0, 10.0, 13.0, 7.0, 13.0, 4.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.15625, -34.94482421875, -33.7333984375, -32.52197265625, -31.310546875, -30.09912109375, -28.8876953125, -27.67626953125, -26.46484375, -25.25341796875, -24.0419921875, -22.83056640625, -21.619140625, -20.40771484375, -19.1962890625, -17.98486328125, -16.7734375, -15.56201171875, -14.3505859375, -13.13916015625, -11.927734375, -10.71630859375, -9.5048828125, -8.29345703125, -7.08203125, -5.87060546875, -4.6591796875, -3.44775390625, -2.236328125, -1.02490234375, 0.1865234375, 1.39794921875, 2.609375, 3.82080078125, 5.0322265625, 6.24365234375, 7.455078125, 8.66650390625, 9.8779296875, 11.08935546875, 12.30078125, 13.51220703125, 14.7236328125, 15.93505859375, 17.146484375, 18.35791015625, 19.5693359375, 20.78076171875, 21.9921875, 23.20361328125, 24.4150390625, 25.62646484375, 26.837890625, 28.04931640625, 29.2607421875, 30.47216796875, 31.68359375, 32.89501953125, 34.1064453125, 35.31787109375, 36.529296875, 37.74072265625, 38.9521484375, 40.16357421875, 41.375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 5.0, 6.0, 14.0, 23.0, 24.0, 40.0, 68.0, 90.0, 123.0, 202.0, 323.0, 467.0, 684.0, 1080.0, 1618.0, 2529.0, 3866.0, 6005.0, 9517.0, 14857.0, 23139.0, 35281.0, 52759.0, 74891.0, 99049.0, 119334.0, 128011.0, 121432.0, 104619.0, 80654.0, 57572.0, 39025.0, 25472.0, 16312.0, 10361.0, 6739.0, 4398.0, 2716.0, 1773.0, 1172.0, 785.0, 504.0, 354.0, 219.0, 171.0, 86.0, 70.0, 42.0, 23.0, 27.0, 12.0, 10.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0625, -13.587646484375, -13.11279296875, -12.637939453125, -12.1630859375, -11.688232421875, -11.21337890625, -10.738525390625, -10.263671875, -9.788818359375, -9.31396484375, -8.839111328125, -8.3642578125, -7.889404296875, -7.41455078125, -6.939697265625, -6.46484375, -5.989990234375, -5.51513671875, -5.040283203125, -4.5654296875, -4.090576171875, -3.61572265625, -3.140869140625, -2.666015625, -2.191162109375, -1.71630859375, -1.241455078125, -0.7666015625, -0.291748046875, 0.18310546875, 0.657958984375, 1.1328125, 1.607666015625, 2.08251953125, 2.557373046875, 3.0322265625, 3.507080078125, 3.98193359375, 4.456787109375, 4.931640625, 5.406494140625, 5.88134765625, 6.356201171875, 6.8310546875, 7.305908203125, 7.78076171875, 8.255615234375, 8.73046875, 9.205322265625, 9.68017578125, 10.155029296875, 10.6298828125, 11.104736328125, 11.57958984375, 12.054443359375, 12.529296875, 13.004150390625, 13.47900390625, 13.953857421875, 14.4287109375, 14.903564453125, 15.37841796875, 15.853271484375, 16.328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 3.0, 13.0, 8.0, 14.0, 17.0, 23.0, 30.0, 35.0, 42.0, 53.0, 64.0, 63.0, 71.0, 73.0, 69.0, 69.0, 72.0, 53.0, 49.0, 44.0, 31.0, 23.0, 19.0, 11.0, 19.0, 8.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028591156005859375, -0.0027809441089630127, -0.002702772617340088, -0.002624601125717163, -0.0025464296340942383, -0.0024682581424713135, -0.0023900866508483887, -0.002311915159225464, -0.002233743667602539, -0.0021555721759796143, -0.0020774006843566895, -0.0019992291927337646, -0.0019210577011108398, -0.001842886209487915, -0.0017647147178649902, -0.0016865432262420654, -0.0016083717346191406, -0.0015302002429962158, -0.001452028751373291, -0.0013738572597503662, -0.0012956857681274414, -0.0012175142765045166, -0.0011393427848815918, -0.001061171293258667, -0.0009829998016357422, -0.0009048283100128174, -0.0008266568183898926, -0.0007484853267669678, -0.000670313835144043, -0.0005921423435211182, -0.0005139708518981934, -0.00043579936027526855, -0.00035762786865234375, -0.00027945637702941895, -0.00020128488540649414, -0.00012311339378356934, -4.494190216064453e-05, 3.3229589462280273e-05, 0.00011140108108520508, 0.00018957257270812988, 0.0002677440643310547, 0.0003459155559539795, 0.0004240870475769043, 0.0005022585391998291, 0.0005804300308227539, 0.0006586015224456787, 0.0007367730140686035, 0.0008149445056915283, 0.0008931159973144531, 0.0009712874889373779, 0.0010494589805603027, 0.0011276304721832275, 0.0012058019638061523, 0.0012839734554290771, 0.001362144947052002, 0.0014403164386749268, 0.0015184879302978516, 0.0015966594219207764, 0.0016748309135437012, 0.001753002405166626, 0.0018311738967895508, 0.0019093453884124756, 0.0019875168800354004, 0.002065688371658325, 0.00214385986328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 8.0, 9.0, 11.0, 32.0, 32.0, 61.0, 74.0, 99.0, 155.0, 256.0, 351.0, 579.0, 893.0, 1343.0, 2156.0, 3288.0, 5144.0, 8244.0, 12763.0, 19728.0, 29843.0, 44074.0, 61781.0, 82483.0, 102674.0, 116517.0, 119695.0, 110736.0, 93304.0, 73067.0, 53043.0, 36491.0, 24690.0, 16037.0, 10327.0, 6573.0, 4262.0, 2800.0, 1752.0, 1113.0, 721.0, 430.0, 313.0, 214.0, 122.0, 82.0, 65.0, 33.0, 32.0, 26.0, 15.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.828125, -13.3712158203125, -12.914306640625, -12.4573974609375, -12.00048828125, -11.5435791015625, -11.086669921875, -10.6297607421875, -10.1728515625, -9.7159423828125, -9.259033203125, -8.8021240234375, -8.34521484375, -7.8883056640625, -7.431396484375, -6.9744873046875, -6.517578125, -6.0606689453125, -5.603759765625, -5.1468505859375, -4.68994140625, -4.2330322265625, -3.776123046875, -3.3192138671875, -2.8623046875, -2.4053955078125, -1.948486328125, -1.4915771484375, -1.03466796875, -0.5777587890625, -0.120849609375, 0.3360595703125, 0.79296875, 1.2498779296875, 1.706787109375, 2.1636962890625, 2.62060546875, 3.0775146484375, 3.534423828125, 3.9913330078125, 4.4482421875, 4.9051513671875, 5.362060546875, 5.8189697265625, 6.27587890625, 6.7327880859375, 7.189697265625, 7.6466064453125, 8.103515625, 8.5604248046875, 9.017333984375, 9.4742431640625, 9.93115234375, 10.3880615234375, 10.844970703125, 11.3018798828125, 11.7587890625, 12.2156982421875, 12.672607421875, 13.1295166015625, 13.58642578125, 14.0433349609375, 14.500244140625, 14.9571533203125, 15.4140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 0.0, 3.0, 11.0, 11.0, 7.0, 7.0, 15.0, 10.0, 16.0, 27.0, 16.0, 33.0, 33.0, 44.0, 45.0, 28.0, 49.0, 54.0, 56.0, 41.0, 48.0, 55.0, 50.0, 45.0, 44.0, 41.0, 39.0, 30.0, 17.0, 26.0, 22.0, 14.0, 9.0, 11.0, 13.0, 8.0, 10.0, 1.0, 5.0, 2.0, 0.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.34375, -8.1080322265625, -7.872314453125, -7.6365966796875, -7.40087890625, -7.1651611328125, -6.929443359375, -6.6937255859375, -6.4580078125, -6.2222900390625, -5.986572265625, -5.7508544921875, -5.51513671875, -5.2794189453125, -5.043701171875, -4.8079833984375, -4.572265625, -4.3365478515625, -4.100830078125, -3.8651123046875, -3.62939453125, -3.3936767578125, -3.157958984375, -2.9222412109375, -2.6865234375, -2.4508056640625, -2.215087890625, -1.9793701171875, -1.74365234375, -1.5079345703125, -1.272216796875, -1.0364990234375, -0.80078125, -0.5650634765625, -0.329345703125, -0.0936279296875, 0.14208984375, 0.3778076171875, 0.613525390625, 0.8492431640625, 1.0849609375, 1.3206787109375, 1.556396484375, 1.7921142578125, 2.02783203125, 2.2635498046875, 2.499267578125, 2.7349853515625, 2.970703125, 3.2064208984375, 3.442138671875, 3.6778564453125, 3.91357421875, 4.1492919921875, 4.385009765625, 4.6207275390625, 4.8564453125, 5.0921630859375, 5.327880859375, 5.5635986328125, 5.79931640625, 6.0350341796875, 6.270751953125, 6.5064697265625, 6.7421875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 7.0, 6.0, 10.0, 12.0, 13.0, 15.0, 14.0, 19.0, 25.0, 26.0, 29.0, 27.0, 35.0, 35.0, 34.0, 45.0, 44.0, 59.0, 38.0, 37.0, 48.0, 39.0, 39.0, 41.0, 33.0, 28.0, 37.0, 34.0, 27.0, 15.0, 20.0, 19.0, 13.0, 15.0, 12.0, 14.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.18128967285156, -63.26628494262695, -61.351280212402344, -59.436275482177734, -57.521270751953125, -55.606266021728516, -53.691261291503906, -51.7762565612793, -49.86125183105469, -47.94624710083008, -46.03124237060547, -44.11623764038086, -42.20123291015625, -40.28622817993164, -38.37122344970703, -36.45621871948242, -34.54121398925781, -32.6262092590332, -30.711204528808594, -28.796199798583984, -26.881195068359375, -24.966190338134766, -23.051185607910156, -21.136180877685547, -19.221176147460938, -17.306171417236328, -15.391166687011719, -13.47616195678711, -11.5611572265625, -9.64615249633789, -7.731147766113281, -5.816143035888672, -3.9011383056640625, -1.9861335754394531, -0.07112884521484375, 1.8438758850097656, 3.758880615234375, 5.673885345458984, 7.588890075683594, 9.503894805908203, 11.418899536132812, 13.333904266357422, 15.248908996582031, 17.16391372680664, 19.07891845703125, 20.99392318725586, 22.90892791748047, 24.823932647705078, 26.738937377929688, 28.653942108154297, 30.568946838378906, 32.483951568603516, 34.398956298828125, 36.313961029052734, 38.228965759277344, 40.14397048950195, 42.05897521972656, 43.97397994995117, 45.88898468017578, 47.80398941040039, 49.718994140625, 51.63399887084961, 53.54900360107422, 55.46400833129883, 57.37901306152344]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 5.0, 13.0, 13.0, 14.0, 14.0, 15.0, 18.0, 18.0, 24.0, 24.0, 15.0, 28.0, 25.0, 27.0, 43.0, 40.0, 26.0, 43.0, 38.0, 35.0, 33.0, 44.0, 37.0, 33.0, 30.0, 36.0, 37.0, 27.0, 28.0, 33.0, 20.0, 28.0, 18.0, 16.0, 14.0, 13.0, 11.0, 8.0, 10.0, 7.0, 11.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.16705322265625, -54.35741424560547, -52.54777908325195, -50.73814010620117, -48.92850112915039, -47.118865966796875, -45.309226989746094, -43.49958801269531, -41.68994903564453, -39.88031005859375, -38.070674896240234, -36.26103591918945, -34.45139694213867, -32.641761779785156, -30.832122802734375, -29.022483825683594, -27.212848663330078, -25.40321159362793, -23.59357261657715, -21.783935546875, -19.97429656982422, -18.16465950012207, -16.355022430419922, -14.545384407043457, -12.735746383666992, -10.926108360290527, -9.116470336914062, -7.306833267211914, -5.497195243835449, -3.6875572204589844, -1.877920150756836, -0.0682821273803711, 1.7413597106933594, 3.550997495651245, 5.360635280609131, 7.1702728271484375, 8.979910850524902, 10.789548873901367, 12.599185943603516, 14.40882396697998, 16.218461990356445, 18.028099060058594, 19.837738037109375, 21.647375106811523, 23.457012176513672, 25.266651153564453, 27.0762882232666, 28.88592529296875, 30.69556427001953, 32.50520324707031, 34.31483840942383, 36.12447738647461, 37.93411636352539, 39.743751525878906, 41.55339050292969, 43.36302947998047, 45.17266845703125, 46.98230743408203, 48.79194259643555, 50.60158157348633, 52.41122055053711, 54.220855712890625, 56.030494689941406, 57.84013366699219, 59.6497688293457]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 17.0, 24.0, 38.0, 61.0, 70.0, 136.0, 198.0, 348.0, 498.0, 784.0, 1193.0, 1968.0, 3114.0, 4883.0, 7999.0, 12563.0, 19346.0, 30379.0, 47212.0, 73457.0, 111603.0, 166203.0, 239627.0, 329306.0, 422832.0, 494039.0, 510119.0, 465316.0, 379643.0, 282874.0, 200389.0, 135679.0, 89448.0, 58529.0, 37780.0, 23956.0, 15367.0, 9803.0, 6309.0, 3970.0, 2620.0, 1659.0, 1086.0, 631.0, 419.0, 276.0, 182.0, 121.0, 71.0, 35.0, 31.0, 21.0, 19.0, 12.0, 6.0, 5.0, 4.0, 1.0], "bins": [-56.96875, -55.2021484375, -53.435546875, -51.6689453125, -49.90234375, -48.1357421875, -46.369140625, -44.6025390625, -42.8359375, -41.0693359375, -39.302734375, -37.5361328125, -35.76953125, -34.0029296875, -32.236328125, -30.4697265625, -28.703125, -26.9365234375, -25.169921875, -23.4033203125, -21.63671875, -19.8701171875, -18.103515625, -16.3369140625, -14.5703125, -12.8037109375, -11.037109375, -9.2705078125, -7.50390625, -5.7373046875, -3.970703125, -2.2041015625, -0.4375, 1.3291015625, 3.095703125, 4.8623046875, 6.62890625, 8.3955078125, 10.162109375, 11.9287109375, 13.6953125, 15.4619140625, 17.228515625, 18.9951171875, 20.76171875, 22.5283203125, 24.294921875, 26.0615234375, 27.828125, 29.5947265625, 31.361328125, 33.1279296875, 34.89453125, 36.6611328125, 38.427734375, 40.1943359375, 41.9609375, 43.7275390625, 45.494140625, 47.2607421875, 49.02734375, 50.7939453125, 52.560546875, 54.3271484375, 56.09375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 6.0, 4.0, 10.0, 7.0, 10.0, 12.0, 15.0, 15.0, 17.0, 16.0, 13.0, 31.0, 17.0, 26.0, 23.0, 20.0, 30.0, 40.0, 40.0, 28.0, 38.0, 44.0, 25.0, 36.0, 43.0, 35.0, 35.0, 30.0, 37.0, 35.0, 27.0, 27.0, 29.0, 27.0, 25.0, 21.0, 18.0, 12.0, 12.0, 12.0, 7.0, 10.0, 11.0, 10.0, 6.0, 6.0, 3.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.03125, -47.46875, -45.90625, -44.34375, -42.78125, -41.21875, -39.65625, -38.09375, -36.53125, -34.96875, -33.40625, -31.84375, -30.28125, -28.71875, -27.15625, -25.59375, -24.03125, -22.46875, -20.90625, -19.34375, -17.78125, -16.21875, -14.65625, -13.09375, -11.53125, -9.96875, -8.40625, -6.84375, -5.28125, -3.71875, -2.15625, -0.59375, 0.96875, 2.53125, 4.09375, 5.65625, 7.21875, 8.78125, 10.34375, 11.90625, 13.46875, 15.03125, 16.59375, 18.15625, 19.71875, 21.28125, 22.84375, 24.40625, 25.96875, 27.53125, 29.09375, 30.65625, 32.21875, 33.78125, 35.34375, 36.90625, 38.46875, 40.03125, 41.59375, 43.15625, 44.71875, 46.28125, 47.84375, 49.40625, 50.96875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 10.0, 9.0, 14.0, 21.0, 30.0, 42.0, 69.0, 120.0, 155.0, 246.0, 378.0, 726.0, 1250.0, 2134.0, 3834.0, 6950.0, 12806.0, 23908.0, 43825.0, 80598.0, 143223.0, 241744.0, 380137.0, 535252.0, 646465.0, 640993.0, 524491.0, 367146.0, 231874.0, 136760.0, 76565.0, 42223.0, 22903.0, 12034.0, 6843.0, 3637.0, 2009.0, 1158.0, 621.0, 378.0, 268.0, 152.0, 87.0, 56.0, 44.0, 31.0, 22.0, 17.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0], "bins": [-74.125, -71.8056640625, -69.486328125, -67.1669921875, -64.84765625, -62.5283203125, -60.208984375, -57.8896484375, -55.5703125, -53.2509765625, -50.931640625, -48.6123046875, -46.29296875, -43.9736328125, -41.654296875, -39.3349609375, -37.015625, -34.6962890625, -32.376953125, -30.0576171875, -27.73828125, -25.4189453125, -23.099609375, -20.7802734375, -18.4609375, -16.1416015625, -13.822265625, -11.5029296875, -9.18359375, -6.8642578125, -4.544921875, -2.2255859375, 0.09375, 2.4130859375, 4.732421875, 7.0517578125, 9.37109375, 11.6904296875, 14.009765625, 16.3291015625, 18.6484375, 20.9677734375, 23.287109375, 25.6064453125, 27.92578125, 30.2451171875, 32.564453125, 34.8837890625, 37.203125, 39.5224609375, 41.841796875, 44.1611328125, 46.48046875, 48.7998046875, 51.119140625, 53.4384765625, 55.7578125, 58.0771484375, 60.396484375, 62.7158203125, 65.03515625, 67.3544921875, 69.673828125, 71.9931640625, 74.3125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 9.0, 8.0, 17.0, 13.0, 32.0, 34.0, 30.0, 48.0, 48.0, 69.0, 83.0, 83.0, 102.0, 106.0, 141.0, 160.0, 180.0, 184.0, 201.0, 223.0, 196.0, 224.0, 235.0, 209.0, 191.0, 180.0, 146.0, 154.0, 130.0, 107.0, 84.0, 81.0, 72.0, 68.0, 51.0, 42.0, 32.0, 23.0, 21.0, 18.0, 9.0, 3.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.265625, -26.41650390625, -25.5673828125, -24.71826171875, -23.869140625, -23.02001953125, -22.1708984375, -21.32177734375, -20.47265625, -19.62353515625, -18.7744140625, -17.92529296875, -17.076171875, -16.22705078125, -15.3779296875, -14.52880859375, -13.6796875, -12.83056640625, -11.9814453125, -11.13232421875, -10.283203125, -9.43408203125, -8.5849609375, -7.73583984375, -6.88671875, -6.03759765625, -5.1884765625, -4.33935546875, -3.490234375, -2.64111328125, -1.7919921875, -0.94287109375, -0.09375, 0.75537109375, 1.6044921875, 2.45361328125, 3.302734375, 4.15185546875, 5.0009765625, 5.85009765625, 6.69921875, 7.54833984375, 8.3974609375, 9.24658203125, 10.095703125, 10.94482421875, 11.7939453125, 12.64306640625, 13.4921875, 14.34130859375, 15.1904296875, 16.03955078125, 16.888671875, 17.73779296875, 18.5869140625, 19.43603515625, 20.28515625, 21.13427734375, 21.9833984375, 22.83251953125, 23.681640625, 24.53076171875, 25.3798828125, 26.22900390625, 27.078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 5.0, 5.0, 6.0, 8.0, 9.0, 14.0, 13.0, 22.0, 18.0, 23.0, 32.0, 27.0, 35.0, 30.0, 42.0, 47.0, 44.0, 38.0, 49.0, 43.0, 48.0, 37.0, 33.0, 32.0, 46.0, 43.0, 30.0, 44.0, 34.0, 18.0, 20.0, 18.0, 13.0, 17.0, 9.0, 9.0, 5.0, 12.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-66.95327758789062, -64.97203826904297, -62.99079132080078, -61.00954818725586, -59.02830505371094, -57.04706573486328, -55.06582260131836, -53.08457946777344, -51.103336334228516, -49.122093200683594, -47.14085006713867, -45.15960693359375, -43.178367614746094, -41.197120666503906, -39.21588134765625, -37.23463821411133, -35.253395080566406, -33.272151947021484, -31.290908813476562, -29.309667587280273, -27.32842445373535, -25.34718132019043, -23.36594009399414, -21.38469696044922, -19.403453826904297, -17.422210693359375, -15.44096851348877, -13.459726333618164, -11.478483200073242, -9.49724006652832, -7.515997886657715, -5.534755706787109, -3.5535125732421875, -1.5722699165344238, 0.40897274017333984, 2.3902153968811035, 4.371458053588867, 6.352701187133789, 8.333943367004395, 10.315185546875, 12.296428680419922, 14.277671813964844, 16.258914947509766, 18.240156173706055, 20.221399307250977, 22.2026424407959, 24.183883666992188, 26.16512680053711, 28.14636993408203, 30.127613067626953, 32.108856201171875, 34.0900993347168, 36.07134246826172, 38.052581787109375, 40.0338249206543, 42.01506805419922, 43.99631118774414, 45.97755432128906, 47.958797454833984, 49.940040588378906, 51.92127990722656, 53.90252685546875, 55.883766174316406, 57.86500930786133, 59.84625244140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 4.0, 7.0, 6.0, 10.0, 14.0, 12.0, 13.0, 15.0, 17.0, 11.0, 22.0, 29.0, 30.0, 28.0, 35.0, 36.0, 34.0, 43.0, 29.0, 42.0, 45.0, 40.0, 49.0, 46.0, 30.0, 37.0, 36.0, 25.0, 38.0, 31.0, 31.0, 19.0, 22.0, 22.0, 14.0, 17.0, 12.0, 6.0, 9.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.89384078979492, -53.91671371459961, -51.9395866394043, -49.96245574951172, -47.985328674316406, -46.008201599121094, -44.03107452392578, -42.05394744873047, -40.076820373535156, -38.099693298339844, -36.12256622314453, -34.14543914794922, -32.16830825805664, -30.191181182861328, -28.214054107666016, -26.236927032470703, -24.259796142578125, -22.282669067382812, -20.305540084838867, -18.328413009643555, -16.35128402709961, -14.374156951904297, -12.397029876708984, -10.419901847839355, -8.442773818969727, -6.465645790100098, -4.488518238067627, -2.5113906860351562, -0.5342626571655273, 1.4428653717041016, 3.419992446899414, 5.397120475769043, 7.3742523193359375, 9.351380348205566, 11.328508377075195, 13.305635452270508, 15.282763481140137, 17.259891510009766, 19.237018585205078, 21.21414566040039, 23.191274642944336, 25.16840171813965, 27.145530700683594, 29.122657775878906, 31.09978485107422, 33.07691192626953, 35.054039001464844, 37.03116989135742, 39.008296966552734, 40.98542404174805, 42.96255111694336, 44.93968200683594, 46.91680908203125, 48.89393615722656, 50.871063232421875, 52.84819030761719, 54.8253173828125, 56.80244445800781, 58.779571533203125, 60.75669860839844, 62.733829498291016, 64.71095275878906, 66.68807983398438, 68.66521453857422, 70.64234161376953]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 4.0, 2.0, 20.0, 28.0, 31.0, 60.0, 80.0, 117.0, 189.0, 346.0, 494.0, 725.0, 1171.0, 1862.0, 2890.0, 4407.0, 7115.0, 11148.0, 17391.0, 26691.0, 39669.0, 57090.0, 77675.0, 99170.0, 115209.0, 121406.0, 115026.0, 99080.0, 78407.0, 57105.0, 39580.0, 26534.0, 17482.0, 11035.0, 7010.0, 4471.0, 2827.0, 1746.0, 1219.0, 720.0, 460.0, 304.0, 196.0, 116.0, 85.0, 50.0, 41.0, 22.0, 15.0, 8.0, 14.0, 10.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.71875, -26.74609375, -25.7734375, -24.80078125, -23.828125, -22.85546875, -21.8828125, -20.91015625, -19.9375, -18.96484375, -17.9921875, -17.01953125, -16.046875, -15.07421875, -14.1015625, -13.12890625, -12.15625, -11.18359375, -10.2109375, -9.23828125, -8.265625, -7.29296875, -6.3203125, -5.34765625, -4.375, -3.40234375, -2.4296875, -1.45703125, -0.484375, 0.48828125, 1.4609375, 2.43359375, 3.40625, 4.37890625, 5.3515625, 6.32421875, 7.296875, 8.26953125, 9.2421875, 10.21484375, 11.1875, 12.16015625, 13.1328125, 14.10546875, 15.078125, 16.05078125, 17.0234375, 17.99609375, 18.96875, 19.94140625, 20.9140625, 21.88671875, 22.859375, 23.83203125, 24.8046875, 25.77734375, 26.75, 27.72265625, 28.6953125, 29.66796875, 30.640625, 31.61328125, 32.5859375, 33.55859375, 34.53125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 8.0, 3.0, 12.0, 13.0, 13.0, 9.0, 17.0, 13.0, 20.0, 19.0, 21.0, 30.0, 34.0, 29.0, 34.0, 42.0, 39.0, 29.0, 40.0, 49.0, 32.0, 44.0, 41.0, 47.0, 36.0, 29.0, 35.0, 32.0, 33.0, 29.0, 24.0, 24.0, 17.0, 18.0, 13.0, 15.0, 10.0, 6.0, 7.0, 13.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.03125, -53.98583984375, -51.9404296875, -49.89501953125, -47.849609375, -45.80419921875, -43.7587890625, -41.71337890625, -39.66796875, -37.62255859375, -35.5771484375, -33.53173828125, -31.486328125, -29.44091796875, -27.3955078125, -25.35009765625, -23.3046875, -21.25927734375, -19.2138671875, -17.16845703125, -15.123046875, -13.07763671875, -11.0322265625, -8.98681640625, -6.94140625, -4.89599609375, -2.8505859375, -0.80517578125, 1.240234375, 3.28564453125, 5.3310546875, 7.37646484375, 9.421875, 11.46728515625, 13.5126953125, 15.55810546875, 17.603515625, 19.64892578125, 21.6943359375, 23.73974609375, 25.78515625, 27.83056640625, 29.8759765625, 31.92138671875, 33.966796875, 36.01220703125, 38.0576171875, 40.10302734375, 42.1484375, 44.19384765625, 46.2392578125, 48.28466796875, 50.330078125, 52.37548828125, 54.4208984375, 56.46630859375, 58.51171875, 60.55712890625, 62.6025390625, 64.64794921875, 66.693359375, 68.73876953125, 70.7841796875, 72.82958984375, 74.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 4.0, 3.0, 17.0, 16.0, 27.0, 42.0, 41.0, 55.0, 82.0, 117.0, 139.0, 230.0, 351.0, 422.0, 685.0, 1009.0, 1491.0, 2145.0, 3177.0, 4888.0, 7677.0, 11506.0, 17810.0, 29831.0, 287047.0, 587386.0, 34705.0, 19876.0, 12723.0, 8289.0, 5356.0, 3622.0, 2416.0, 1625.0, 1155.0, 782.0, 561.0, 351.0, 248.0, 172.0, 139.0, 100.0, 67.0, 63.0, 31.0, 28.0, 12.0, 9.0, 8.0, 4.0, 6.0, 4.0, 0.0, 2.0, 3.0], "bins": [-66.5, -64.55029296875, -62.6005859375, -60.65087890625, -58.701171875, -56.75146484375, -54.8017578125, -52.85205078125, -50.90234375, -48.95263671875, -47.0029296875, -45.05322265625, -43.103515625, -41.15380859375, -39.2041015625, -37.25439453125, -35.3046875, -33.35498046875, -31.4052734375, -29.45556640625, -27.505859375, -25.55615234375, -23.6064453125, -21.65673828125, -19.70703125, -17.75732421875, -15.8076171875, -13.85791015625, -11.908203125, -9.95849609375, -8.0087890625, -6.05908203125, -4.109375, -2.15966796875, -0.2099609375, 1.73974609375, 3.689453125, 5.63916015625, 7.5888671875, 9.53857421875, 11.48828125, 13.43798828125, 15.3876953125, 17.33740234375, 19.287109375, 21.23681640625, 23.1865234375, 25.13623046875, 27.0859375, 29.03564453125, 30.9853515625, 32.93505859375, 34.884765625, 36.83447265625, 38.7841796875, 40.73388671875, 42.68359375, 44.63330078125, 46.5830078125, 48.53271484375, 50.482421875, 52.43212890625, 54.3818359375, 56.33154296875, 58.28125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 8.0, 8.0, 6.0, 16.0, 12.0, 12.0, 8.0, 34.0, 29.0, 28.0, 30.0, 35.0, 32.0, 34.0, 45.0, 32.0, 46.0, 48.0, 34.0, 42.0, 43.0, 44.0, 43.0, 44.0, 46.0, 38.0, 33.0, 24.0, 16.0, 20.0, 14.0, 8.0, 15.0, 13.0, 10.0, 13.0, 6.0, 7.0, 9.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.6875, -51.0751953125, -49.462890625, -47.8505859375, -46.23828125, -44.6259765625, -43.013671875, -41.4013671875, -39.7890625, -38.1767578125, -36.564453125, -34.9521484375, -33.33984375, -31.7275390625, -30.115234375, -28.5029296875, -26.890625, -25.2783203125, -23.666015625, -22.0537109375, -20.44140625, -18.8291015625, -17.216796875, -15.6044921875, -13.9921875, -12.3798828125, -10.767578125, -9.1552734375, -7.54296875, -5.9306640625, -4.318359375, -2.7060546875, -1.09375, 0.5185546875, 2.130859375, 3.7431640625, 5.35546875, 6.9677734375, 8.580078125, 10.1923828125, 11.8046875, 13.4169921875, 15.029296875, 16.6416015625, 18.25390625, 19.8662109375, 21.478515625, 23.0908203125, 24.703125, 26.3154296875, 27.927734375, 29.5400390625, 31.15234375, 32.7646484375, 34.376953125, 35.9892578125, 37.6015625, 39.2138671875, 40.826171875, 42.4384765625, 44.05078125, 45.6630859375, 47.275390625, 48.8876953125, 50.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 10.0, 4.0, 6.0, 21.0, 22.0, 29.0, 41.0, 59.0, 82.0, 132.0, 185.0, 287.0, 467.0, 708.0, 1050.0, 1867.0, 3127.0, 5640.0, 10474.0, 20405.0, 51378.0, 804085.0, 94663.0, 24992.0, 12572.0, 6808.0, 3780.0, 2033.0, 1248.0, 847.0, 497.0, 328.0, 217.0, 132.0, 95.0, 82.0, 54.0, 29.0, 29.0, 18.0, 9.0, 10.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.08984375, -5.877197265625, -5.66455078125, -5.451904296875, -5.2392578125, -5.026611328125, -4.81396484375, -4.601318359375, -4.388671875, -4.176025390625, -3.96337890625, -3.750732421875, -3.5380859375, -3.325439453125, -3.11279296875, -2.900146484375, -2.6875, -2.474853515625, -2.26220703125, -2.049560546875, -1.8369140625, -1.624267578125, -1.41162109375, -1.198974609375, -0.986328125, -0.773681640625, -0.56103515625, -0.348388671875, -0.1357421875, 0.076904296875, 0.28955078125, 0.502197265625, 0.71484375, 0.927490234375, 1.14013671875, 1.352783203125, 1.5654296875, 1.778076171875, 1.99072265625, 2.203369140625, 2.416015625, 2.628662109375, 2.84130859375, 3.053955078125, 3.2666015625, 3.479248046875, 3.69189453125, 3.904541015625, 4.1171875, 4.329833984375, 4.54248046875, 4.755126953125, 4.9677734375, 5.180419921875, 5.39306640625, 5.605712890625, 5.818359375, 6.031005859375, 6.24365234375, 6.456298828125, 6.6689453125, 6.881591796875, 7.09423828125, 7.306884765625, 7.51953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 12.0, 8.0, 10.0, 16.0, 4.0, 16.0, 22.0, 22.0, 31.0, 31.0, 33.0, 41.0, 55.0, 66.0, 53.0, 54.0, 52.0, 55.0, 61.0, 54.0, 43.0, 34.0, 42.0, 28.0, 30.0, 25.0, 19.0, 15.0, 4.0, 12.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0009131431579589844, -0.0008829161524772644, -0.0008526891469955444, -0.0008224621415138245, -0.0007922351360321045, -0.0007620081305503845, -0.0007317811250686646, -0.0007015541195869446, -0.0006713271141052246, -0.0006411001086235046, -0.0006108731031417847, -0.0005806460976600647, -0.0005504190921783447, -0.0005201920866966248, -0.0004899650812149048, -0.0004597380757331848, -0.00042951107025146484, -0.0003992840647697449, -0.0003690570592880249, -0.00033883005380630493, -0.00030860304832458496, -0.000278376042842865, -0.000248149037361145, -0.00021792203187942505, -0.00018769502639770508, -0.0001574680209159851, -0.00012724101543426514, -9.701400995254517e-05, -6.67870044708252e-05, -3.6559998989105225e-05, -6.332993507385254e-06, 2.3894011974334717e-05, 5.412101745605469e-05, 8.434802293777466e-05, 0.00011457502841949463, 0.0001448020339012146, 0.00017502903938293457, 0.00020525604486465454, 0.0002354830503463745, 0.0002657100558280945, 0.00029593706130981445, 0.0003261640667915344, 0.0003563910722732544, 0.00038661807775497437, 0.00041684508323669434, 0.0004470720887184143, 0.0004772990942001343, 0.0005075260996818542, 0.0005377531051635742, 0.0005679801106452942, 0.0005982071161270142, 0.0006284341216087341, 0.0006586611270904541, 0.0006888881325721741, 0.000719115138053894, 0.000749342143535614, 0.000779569149017334, 0.000809796154499054, 0.0008400231599807739, 0.0008702501654624939, 0.0009004771709442139, 0.0009307041764259338, 0.0009609311819076538, 0.0009911581873893738, 0.0010213851928710938]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 9.0, 20.0, 24.0, 36.0, 40.0, 66.0, 108.0, 154.0, 211.0, 303.0, 480.0, 743.0, 1007.0, 1552.0, 2364.0, 3465.0, 5076.0, 7742.0, 11775.0, 17454.0, 26043.0, 37878.0, 52949.0, 71034.0, 90389.0, 105971.0, 114173.0, 111468.0, 99676.0, 81631.0, 62521.0, 45205.0, 31775.0, 21804.0, 14410.0, 9751.0, 6430.0, 4269.0, 2806.0, 1830.0, 1235.0, 880.0, 577.0, 396.0, 265.0, 198.0, 111.0, 96.0, 61.0, 41.0, 27.0, 10.0, 6.0, 9.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.09375, -2.023406982421875, -1.95306396484375, -1.882720947265625, -1.8123779296875, -1.742034912109375, -1.67169189453125, -1.601348876953125, -1.531005859375, -1.460662841796875, -1.39031982421875, -1.319976806640625, -1.2496337890625, -1.179290771484375, -1.10894775390625, -1.038604736328125, -0.96826171875, -0.897918701171875, -0.82757568359375, -0.757232666015625, -0.6868896484375, -0.616546630859375, -0.54620361328125, -0.475860595703125, -0.405517578125, -0.335174560546875, -0.26483154296875, -0.194488525390625, -0.1241455078125, -0.053802490234375, 0.01654052734375, 0.086883544921875, 0.1572265625, 0.227569580078125, 0.29791259765625, 0.368255615234375, 0.4385986328125, 0.508941650390625, 0.57928466796875, 0.649627685546875, 0.719970703125, 0.790313720703125, 0.86065673828125, 0.930999755859375, 1.0013427734375, 1.071685791015625, 1.14202880859375, 1.212371826171875, 1.28271484375, 1.353057861328125, 1.42340087890625, 1.493743896484375, 1.5640869140625, 1.634429931640625, 1.70477294921875, 1.775115966796875, 1.845458984375, 1.915802001953125, 1.98614501953125, 2.056488037109375, 2.1268310546875, 2.197174072265625, 2.26751708984375, 2.337860107421875, 2.408203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 11.0, 12.0, 22.0, 21.0, 11.0, 35.0, 39.0, 44.0, 36.0, 43.0, 52.0, 48.0, 56.0, 66.0, 47.0, 52.0, 62.0, 43.0, 39.0, 44.0, 34.0, 35.0, 21.0, 27.0, 16.0, 11.0, 14.0, 6.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.353515625, -1.3142852783203125, -1.275054931640625, -1.2358245849609375, -1.19659423828125, -1.1573638916015625, -1.118133544921875, -1.0789031982421875, -1.0396728515625, -1.0004425048828125, -0.961212158203125, -0.9219818115234375, -0.88275146484375, -0.8435211181640625, -0.804290771484375, -0.7650604248046875, -0.725830078125, -0.6865997314453125, -0.647369384765625, -0.6081390380859375, -0.56890869140625, -0.5296783447265625, -0.490447998046875, -0.4512176513671875, -0.4119873046875, -0.3727569580078125, -0.333526611328125, -0.2942962646484375, -0.25506591796875, -0.2158355712890625, -0.176605224609375, -0.1373748779296875, -0.09814453125, -0.0589141845703125, -0.019683837890625, 0.0195465087890625, 0.05877685546875, 0.0980072021484375, 0.137237548828125, 0.1764678955078125, 0.2156982421875, 0.2549285888671875, 0.294158935546875, 0.3333892822265625, 0.37261962890625, 0.4118499755859375, 0.451080322265625, 0.4903106689453125, 0.529541015625, 0.5687713623046875, 0.608001708984375, 0.6472320556640625, 0.68646240234375, 0.7256927490234375, 0.764923095703125, 0.8041534423828125, 0.8433837890625, 0.8826141357421875, 0.921844482421875, 0.9610748291015625, 1.00030517578125, 1.0395355224609375, 1.078765869140625, 1.1179962158203125, 1.1572265625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 10.0, 11.0, 11.0, 12.0, 17.0, 18.0, 24.0, 35.0, 32.0, 32.0, 41.0, 44.0, 48.0, 48.0, 51.0, 44.0, 46.0, 50.0, 33.0, 36.0, 38.0, 42.0, 38.0, 39.0, 31.0, 23.0, 22.0, 26.0, 11.0, 10.0, 11.0, 10.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-75.80357360839844, -73.64806365966797, -71.4925537109375, -69.33704376220703, -67.18153381347656, -65.0260238647461, -62.87051773071289, -60.71500778198242, -58.55949783325195, -56.403987884521484, -54.248477935791016, -52.09296798706055, -49.937461853027344, -47.781951904296875, -45.626441955566406, -43.47093200683594, -41.31542205810547, -39.159912109375, -37.00440216064453, -34.84889221191406, -32.693382263183594, -30.537874221801758, -28.382366180419922, -26.226856231689453, -24.071346282958984, -21.915836334228516, -19.760326385498047, -17.60481834411621, -15.449308395385742, -13.293798446655273, -11.138289451599121, -8.982780456542969, -6.827274322509766, -4.671764850616455, -2.5162553787231445, -0.360745906829834, 1.7947635650634766, 3.9502735137939453, 6.105782508850098, 8.26129150390625, 10.416801452636719, 12.572311401367188, 14.72782039642334, 16.883329391479492, 19.03883934020996, 21.19434928894043, 23.349857330322266, 25.505367279052734, 27.660877227783203, 29.816387176513672, 31.97189712524414, 34.12740707397461, 36.28291320800781, 38.43842315673828, 40.59393310546875, 42.74944305419922, 44.90495300292969, 47.060462951660156, 49.215972900390625, 51.371482849121094, 53.52699279785156, 55.68250274658203, 57.838008880615234, 59.9935188293457, 62.14902877807617]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 7.0, 6.0, 7.0, 13.0, 14.0, 10.0, 13.0, 16.0, 19.0, 20.0, 22.0, 26.0, 32.0, 31.0, 38.0, 37.0, 39.0, 37.0, 30.0, 49.0, 40.0, 45.0, 41.0, 43.0, 36.0, 33.0, 36.0, 27.0, 37.0, 30.0, 24.0, 20.0, 18.0, 22.0, 11.0, 16.0, 15.0, 2.0, 9.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.99536895751953, -54.92876434326172, -52.862159729003906, -50.795555114746094, -48.72895050048828, -46.66234588623047, -44.595741271972656, -42.529136657714844, -40.46253204345703, -38.39592742919922, -36.329322814941406, -34.262718200683594, -32.19611358642578, -30.12950897216797, -28.062902450561523, -25.99629783630371, -23.929691314697266, -21.863086700439453, -19.79648208618164, -17.729877471923828, -15.6632719039917, -13.596667289733887, -11.530061721801758, -9.463457107543945, -7.396852493286133, -5.33024787902832, -3.2636427879333496, -1.197037696838379, 0.8695669174194336, 2.936171531677246, 5.002777099609375, 7.0693817138671875, 9.135986328125, 11.202590942382812, 13.269195556640625, 15.335801124572754, 17.40240478515625, 19.469009399414062, 21.535615921020508, 23.60222053527832, 25.668825149536133, 27.735429763793945, 29.802034378051758, 31.868640899658203, 33.935245513916016, 36.00185012817383, 38.06845474243164, 40.13505935668945, 42.201663970947266, 44.26826858520508, 46.33487319946289, 48.4014778137207, 50.468082427978516, 52.53468704223633, 54.601295471191406, 56.66790008544922, 58.73450469970703, 60.801109313964844, 62.867713928222656, 64.93431854248047, 67.00092315673828, 69.0675277709961, 71.1341323852539, 73.20073699951172, 75.26734161376953]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 14.0, 21.0, 14.0, 30.0, 44.0, 57.0, 98.0, 128.0, 182.0, 293.0, 411.0, 679.0, 972.0, 1577.0, 2398.0, 3848.0, 6403.0, 10704.0, 17835.0, 29680.0, 47745.0, 73195.0, 102486.0, 129782.0, 142976.0, 136751.0, 113332.0, 82471.0, 55658.0, 34748.0, 21023.0, 12751.0, 7532.0, 4548.0, 2908.0, 1751.0, 1160.0, 759.0, 483.0, 350.0, 241.0, 148.0, 108.0, 77.0, 60.0, 37.0, 26.0, 18.0, 12.0, 10.0, 4.0, 8.0, 4.0, 3.0, 0.0, 1.0], "bins": [-68.6875, -66.5849609375, -64.482421875, -62.3798828125, -60.27734375, -58.1748046875, -56.072265625, -53.9697265625, -51.8671875, -49.7646484375, -47.662109375, -45.5595703125, -43.45703125, -41.3544921875, -39.251953125, -37.1494140625, -35.046875, -32.9443359375, -30.841796875, -28.7392578125, -26.63671875, -24.5341796875, -22.431640625, -20.3291015625, -18.2265625, -16.1240234375, -14.021484375, -11.9189453125, -9.81640625, -7.7138671875, -5.611328125, -3.5087890625, -1.40625, 0.6962890625, 2.798828125, 4.9013671875, 7.00390625, 9.1064453125, 11.208984375, 13.3115234375, 15.4140625, 17.5166015625, 19.619140625, 21.7216796875, 23.82421875, 25.9267578125, 28.029296875, 30.1318359375, 32.234375, 34.3369140625, 36.439453125, 38.5419921875, 40.64453125, 42.7470703125, 44.849609375, 46.9521484375, 49.0546875, 51.1572265625, 53.259765625, 55.3623046875, 57.46484375, 59.5673828125, 61.669921875, 63.7724609375, 65.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 7.0, 0.0, 5.0, 5.0, 4.0, 8.0, 5.0, 8.0, 14.0, 16.0, 15.0, 14.0, 11.0, 22.0, 23.0, 23.0, 24.0, 31.0, 37.0, 38.0, 37.0, 34.0, 42.0, 35.0, 52.0, 35.0, 47.0, 43.0, 35.0, 38.0, 30.0, 34.0, 31.0, 34.0, 27.0, 18.0, 25.0, 18.0, 19.0, 12.0, 8.0, 12.0, 7.0, 8.0, 12.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.625, -52.7490234375, -50.873046875, -48.9970703125, -47.12109375, -45.2451171875, -43.369140625, -41.4931640625, -39.6171875, -37.7412109375, -35.865234375, -33.9892578125, -32.11328125, -30.2373046875, -28.361328125, -26.4853515625, -24.609375, -22.7333984375, -20.857421875, -18.9814453125, -17.10546875, -15.2294921875, -13.353515625, -11.4775390625, -9.6015625, -7.7255859375, -5.849609375, -3.9736328125, -2.09765625, -0.2216796875, 1.654296875, 3.5302734375, 5.40625, 7.2822265625, 9.158203125, 11.0341796875, 12.91015625, 14.7861328125, 16.662109375, 18.5380859375, 20.4140625, 22.2900390625, 24.166015625, 26.0419921875, 27.91796875, 29.7939453125, 31.669921875, 33.5458984375, 35.421875, 37.2978515625, 39.173828125, 41.0498046875, 42.92578125, 44.8017578125, 46.677734375, 48.5537109375, 50.4296875, 52.3056640625, 54.181640625, 56.0576171875, 57.93359375, 59.8095703125, 61.685546875, 63.5615234375, 65.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 12.0, 19.0, 24.0, 56.0, 81.0, 115.0, 156.0, 259.0, 389.0, 579.0, 859.0, 1403.0, 2429.0, 3838.0, 6484.0, 11297.0, 20446.0, 35294.0, 60573.0, 95516.0, 135745.0, 163314.0, 160509.0, 129149.0, 88265.0, 55305.0, 32340.0, 18194.0, 10479.0, 6011.0, 3540.0, 2165.0, 1318.0, 820.0, 558.0, 322.0, 214.0, 150.0, 109.0, 67.0, 44.0, 30.0, 27.0, 17.0, 7.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.625, -79.9521484375, -77.279296875, -74.6064453125, -71.93359375, -69.2607421875, -66.587890625, -63.9150390625, -61.2421875, -58.5693359375, -55.896484375, -53.2236328125, -50.55078125, -47.8779296875, -45.205078125, -42.5322265625, -39.859375, -37.1865234375, -34.513671875, -31.8408203125, -29.16796875, -26.4951171875, -23.822265625, -21.1494140625, -18.4765625, -15.8037109375, -13.130859375, -10.4580078125, -7.78515625, -5.1123046875, -2.439453125, 0.2333984375, 2.90625, 5.5791015625, 8.251953125, 10.9248046875, 13.59765625, 16.2705078125, 18.943359375, 21.6162109375, 24.2890625, 26.9619140625, 29.634765625, 32.3076171875, 34.98046875, 37.6533203125, 40.326171875, 42.9990234375, 45.671875, 48.3447265625, 51.017578125, 53.6904296875, 56.36328125, 59.0361328125, 61.708984375, 64.3818359375, 67.0546875, 69.7275390625, 72.400390625, 75.0732421875, 77.74609375, 80.4189453125, 83.091796875, 85.7646484375, 88.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 9.0, 6.0, 12.0, 15.0, 17.0, 18.0, 14.0, 21.0, 37.0, 27.0, 36.0, 32.0, 41.0, 49.0, 53.0, 45.0, 42.0, 45.0, 40.0, 46.0, 52.0, 44.0, 36.0, 44.0, 31.0, 32.0, 23.0, 17.0, 24.0, 18.0, 8.0, 12.0, 14.0, 16.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-43.5625, -42.216796875, -40.87109375, -39.525390625, -38.1796875, -36.833984375, -35.48828125, -34.142578125, -32.796875, -31.451171875, -30.10546875, -28.759765625, -27.4140625, -26.068359375, -24.72265625, -23.376953125, -22.03125, -20.685546875, -19.33984375, -17.994140625, -16.6484375, -15.302734375, -13.95703125, -12.611328125, -11.265625, -9.919921875, -8.57421875, -7.228515625, -5.8828125, -4.537109375, -3.19140625, -1.845703125, -0.5, 0.845703125, 2.19140625, 3.537109375, 4.8828125, 6.228515625, 7.57421875, 8.919921875, 10.265625, 11.611328125, 12.95703125, 14.302734375, 15.6484375, 16.994140625, 18.33984375, 19.685546875, 21.03125, 22.376953125, 23.72265625, 25.068359375, 26.4140625, 27.759765625, 29.10546875, 30.451171875, 31.796875, 33.142578125, 34.48828125, 35.833984375, 37.1796875, 38.525390625, 39.87109375, 41.216796875, 42.5625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 15.0, 20.0, 25.0, 35.0, 60.0, 90.0, 155.0, 266.0, 440.0, 766.0, 1254.0, 2036.0, 3736.0, 6529.0, 11717.0, 20416.0, 34799.0, 57247.0, 87455.0, 120736.0, 146029.0, 150679.0, 132084.0, 101420.0, 68222.0, 42752.0, 25298.0, 14590.0, 8432.0, 4807.0, 2667.0, 1525.0, 890.0, 541.0, 312.0, 169.0, 124.0, 69.0, 54.0, 32.0, 21.0, 12.0, 10.0, 5.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.90625, -18.30029296875, -17.6943359375, -17.08837890625, -16.482421875, -15.87646484375, -15.2705078125, -14.66455078125, -14.05859375, -13.45263671875, -12.8466796875, -12.24072265625, -11.634765625, -11.02880859375, -10.4228515625, -9.81689453125, -9.2109375, -8.60498046875, -7.9990234375, -7.39306640625, -6.787109375, -6.18115234375, -5.5751953125, -4.96923828125, -4.36328125, -3.75732421875, -3.1513671875, -2.54541015625, -1.939453125, -1.33349609375, -0.7275390625, -0.12158203125, 0.484375, 1.09033203125, 1.6962890625, 2.30224609375, 2.908203125, 3.51416015625, 4.1201171875, 4.72607421875, 5.33203125, 5.93798828125, 6.5439453125, 7.14990234375, 7.755859375, 8.36181640625, 8.9677734375, 9.57373046875, 10.1796875, 10.78564453125, 11.3916015625, 11.99755859375, 12.603515625, 13.20947265625, 13.8154296875, 14.42138671875, 15.02734375, 15.63330078125, 16.2392578125, 16.84521484375, 17.451171875, 18.05712890625, 18.6630859375, 19.26904296875, 19.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 7.0, 7.0, 10.0, 11.0, 28.0, 20.0, 25.0, 32.0, 34.0, 37.0, 42.0, 49.0, 51.0, 51.0, 42.0, 63.0, 51.0, 45.0, 55.0, 41.0, 35.0, 35.0, 34.0, 34.0, 26.0, 29.0, 11.0, 21.0, 12.0, 14.0, 8.0, 11.0, 4.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019254684448242188, -0.0018616467714309692, -0.0017978250980377197, -0.0017340034246444702, -0.0016701817512512207, -0.0016063600778579712, -0.0015425384044647217, -0.0014787167310714722, -0.0014148950576782227, -0.0013510733842849731, -0.0012872517108917236, -0.0012234300374984741, -0.0011596083641052246, -0.001095786690711975, -0.0010319650173187256, -0.0009681433439254761, -0.0009043216705322266, -0.000840499997138977, -0.0007766783237457275, -0.000712856650352478, -0.0006490349769592285, -0.000585213303565979, -0.0005213916301727295, -0.00045756995677948, -0.00039374828338623047, -0.00032992660999298096, -0.00026610493659973145, -0.00020228326320648193, -0.00013846158981323242, -7.463991641998291e-05, -1.0818243026733398e-05, 5.300343036651611e-05, 0.00011682510375976562, 0.00018064677715301514, 0.00024446845054626465, 0.00030829012393951416, 0.00037211179733276367, 0.0004359334707260132, 0.0004997551441192627, 0.0005635768175125122, 0.0006273984909057617, 0.0006912201642990112, 0.0007550418376922607, 0.0008188635110855103, 0.0008826851844787598, 0.0009465068578720093, 0.0010103285312652588, 0.0010741502046585083, 0.0011379718780517578, 0.0012017935514450073, 0.0012656152248382568, 0.0013294368982315063, 0.0013932585716247559, 0.0014570802450180054, 0.0015209019184112549, 0.0015847235918045044, 0.001648545265197754, 0.0017123669385910034, 0.001776188611984253, 0.0018400102853775024, 0.001903831958770752, 0.0019676536321640015, 0.002031475305557251, 0.0020952969789505005, 0.00215911865234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 18.0, 34.0, 37.0, 41.0, 90.0, 118.0, 176.0, 264.0, 391.0, 599.0, 844.0, 1382.0, 1991.0, 3005.0, 4867.0, 7403.0, 11499.0, 17803.0, 27030.0, 40146.0, 57317.0, 79016.0, 100157.0, 116513.0, 122690.0, 114808.0, 97569.0, 76024.0, 54754.0, 37952.0, 25858.0, 16797.0, 11065.0, 7125.0, 4483.0, 2996.0, 1931.0, 1288.0, 836.0, 507.0, 380.0, 224.0, 165.0, 105.0, 76.0, 49.0, 39.0, 25.0, 17.0, 13.0, 9.0, 6.0, 3.0, 9.0, 3.0, 1.0], "bins": [-16.25, -15.7490234375, -15.248046875, -14.7470703125, -14.24609375, -13.7451171875, -13.244140625, -12.7431640625, -12.2421875, -11.7412109375, -11.240234375, -10.7392578125, -10.23828125, -9.7373046875, -9.236328125, -8.7353515625, -8.234375, -7.7333984375, -7.232421875, -6.7314453125, -6.23046875, -5.7294921875, -5.228515625, -4.7275390625, -4.2265625, -3.7255859375, -3.224609375, -2.7236328125, -2.22265625, -1.7216796875, -1.220703125, -0.7197265625, -0.21875, 0.2822265625, 0.783203125, 1.2841796875, 1.78515625, 2.2861328125, 2.787109375, 3.2880859375, 3.7890625, 4.2900390625, 4.791015625, 5.2919921875, 5.79296875, 6.2939453125, 6.794921875, 7.2958984375, 7.796875, 8.2978515625, 8.798828125, 9.2998046875, 9.80078125, 10.3017578125, 10.802734375, 11.3037109375, 11.8046875, 12.3056640625, 12.806640625, 13.3076171875, 13.80859375, 14.3095703125, 14.810546875, 15.3115234375, 15.8125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 3.0, 10.0, 16.0, 15.0, 24.0, 16.0, 25.0, 20.0, 39.0, 42.0, 41.0, 41.0, 45.0, 60.0, 58.0, 48.0, 66.0, 53.0, 46.0, 36.0, 31.0, 38.0, 38.0, 38.0, 22.0, 24.0, 13.0, 16.0, 16.0, 6.0, 6.0, 9.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.24609375, -7.018798828125, -6.79150390625, -6.564208984375, -6.3369140625, -6.109619140625, -5.88232421875, -5.655029296875, -5.427734375, -5.200439453125, -4.97314453125, -4.745849609375, -4.5185546875, -4.291259765625, -4.06396484375, -3.836669921875, -3.609375, -3.382080078125, -3.15478515625, -2.927490234375, -2.7001953125, -2.472900390625, -2.24560546875, -2.018310546875, -1.791015625, -1.563720703125, -1.33642578125, -1.109130859375, -0.8818359375, -0.654541015625, -0.42724609375, -0.199951171875, 0.02734375, 0.254638671875, 0.48193359375, 0.709228515625, 0.9365234375, 1.163818359375, 1.39111328125, 1.618408203125, 1.845703125, 2.072998046875, 2.30029296875, 2.527587890625, 2.7548828125, 2.982177734375, 3.20947265625, 3.436767578125, 3.6640625, 3.891357421875, 4.11865234375, 4.345947265625, 4.5732421875, 4.800537109375, 5.02783203125, 5.255126953125, 5.482421875, 5.709716796875, 5.93701171875, 6.164306640625, 6.3916015625, 6.618896484375, 6.84619140625, 7.073486328125, 7.30078125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 5.0, 13.0, 9.0, 9.0, 12.0, 12.0, 18.0, 20.0, 29.0, 33.0, 32.0, 41.0, 37.0, 45.0, 36.0, 39.0, 42.0, 33.0, 48.0, 44.0, 35.0, 45.0, 39.0, 42.0, 30.0, 36.0, 26.0, 31.0, 16.0, 22.0, 20.0, 18.0, 12.0, 12.0, 6.0, 14.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-62.189083099365234, -60.27553939819336, -58.361995697021484, -56.44845199584961, -54.534908294677734, -52.621360778808594, -50.70781707763672, -48.794273376464844, -46.88072967529297, -44.967185974121094, -43.05364227294922, -41.140098571777344, -39.22655487060547, -37.313011169433594, -35.39946746826172, -33.48591995239258, -31.572378158569336, -29.65883445739746, -27.745290756225586, -25.831745147705078, -23.918201446533203, -22.004657745361328, -20.091114044189453, -18.177570343017578, -16.264026641845703, -14.350482940673828, -12.436938285827637, -10.523394584655762, -8.60984992980957, -6.696306228637695, -4.78276252746582, -2.869217872619629, -0.9556732177734375, 0.9578708410263062, 2.87141489982605, 4.784958839416504, 6.698503017425537, 8.61204719543457, 10.525590896606445, 12.439135551452637, 14.352679252624512, 16.266223907470703, 18.179767608642578, 20.093311309814453, 22.006855010986328, 23.920398712158203, 25.833942413330078, 27.747488021850586, 29.66103172302246, 31.574575424194336, 33.488121032714844, 35.40166473388672, 37.315208435058594, 39.22875213623047, 41.142295837402344, 43.05583953857422, 44.969383239746094, 46.88292694091797, 48.796470642089844, 50.71001434326172, 52.623558044433594, 54.53710174560547, 56.450645446777344, 58.364192962646484, 60.27773666381836]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 9.0, 12.0, 14.0, 12.0, 28.0, 14.0, 15.0, 17.0, 21.0, 32.0, 37.0, 31.0, 25.0, 33.0, 27.0, 35.0, 42.0, 37.0, 33.0, 38.0, 43.0, 35.0, 47.0, 33.0, 27.0, 25.0, 30.0, 26.0, 33.0, 33.0, 23.0, 12.0, 18.0, 16.0, 7.0, 13.0, 8.0, 12.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.026329040527344, -50.16587829589844, -48.30542755126953, -46.444976806640625, -44.584529876708984, -42.72407913208008, -40.86362838745117, -39.003177642822266, -37.142730712890625, -35.28227996826172, -33.42182922363281, -31.56138038635254, -29.700931549072266, -27.84048080444336, -25.980030059814453, -24.119579315185547, -22.25912857055664, -20.398677825927734, -18.53822898864746, -16.677778244018555, -14.817328453063965, -12.956878662109375, -11.096427917480469, -9.235978126525879, -7.375528335571289, -5.515078544616699, -3.654628276824951, -1.7941780090332031, 0.06627178192138672, 1.9267215728759766, 3.787172317504883, 5.647622108459473, 7.5080718994140625, 9.368521690368652, 11.228971481323242, 13.089422225952148, 14.949872016906738, 16.810321807861328, 18.670772552490234, 20.53122329711914, 22.391672134399414, 24.25212287902832, 26.112571716308594, 27.9730224609375, 29.833473205566406, 31.69392204284668, 33.55437469482422, 35.41482162475586, 37.275272369384766, 39.13572311401367, 40.99617385864258, 42.85662078857422, 44.717071533203125, 46.57752227783203, 48.43797302246094, 50.298423767089844, 52.15887451171875, 54.019325256347656, 55.87977600097656, 57.74022674560547, 59.60067367553711, 61.461124420166016, 63.32157516479492, 65.18202209472656, 67.04247283935547]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 5.0, 11.0, 18.0, 28.0, 42.0, 76.0, 121.0, 200.0, 316.0, 589.0, 952.0, 1492.0, 2526.0, 4350.0, 7005.0, 11884.0, 19751.0, 32830.0, 53605.0, 87683.0, 139074.0, 214626.0, 316454.0, 430625.0, 526383.0, 562820.0, 518340.0, 417305.0, 301483.0, 203956.0, 130892.0, 81386.0, 49896.0, 30420.0, 18512.0, 11151.0, 6719.0, 4072.0, 2501.0, 1595.0, 911.0, 659.0, 373.0, 229.0, 146.0, 86.0, 72.0, 44.0, 24.0, 14.0, 12.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0], "bins": [-58.125, -56.3330078125, -54.541015625, -52.7490234375, -50.95703125, -49.1650390625, -47.373046875, -45.5810546875, -43.7890625, -41.9970703125, -40.205078125, -38.4130859375, -36.62109375, -34.8291015625, -33.037109375, -31.2451171875, -29.453125, -27.6611328125, -25.869140625, -24.0771484375, -22.28515625, -20.4931640625, -18.701171875, -16.9091796875, -15.1171875, -13.3251953125, -11.533203125, -9.7412109375, -7.94921875, -6.1572265625, -4.365234375, -2.5732421875, -0.78125, 1.0107421875, 2.802734375, 4.5947265625, 6.38671875, 8.1787109375, 9.970703125, 11.7626953125, 13.5546875, 15.3466796875, 17.138671875, 18.9306640625, 20.72265625, 22.5146484375, 24.306640625, 26.0986328125, 27.890625, 29.6826171875, 31.474609375, 33.2666015625, 35.05859375, 36.8505859375, 38.642578125, 40.4345703125, 42.2265625, 44.0185546875, 45.810546875, 47.6025390625, 49.39453125, 51.1865234375, 52.978515625, 54.7705078125, 56.5625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 7.0, 7.0, 11.0, 15.0, 13.0, 18.0, 19.0, 16.0, 21.0, 30.0, 24.0, 34.0, 34.0, 34.0, 26.0, 30.0, 31.0, 46.0, 47.0, 45.0, 35.0, 45.0, 31.0, 36.0, 35.0, 23.0, 25.0, 38.0, 36.0, 23.0, 23.0, 22.0, 15.0, 12.0, 16.0, 12.0, 9.0, 7.0, 11.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.78125, -43.15576171875, -41.5302734375, -39.90478515625, -38.279296875, -36.65380859375, -35.0283203125, -33.40283203125, -31.77734375, -30.15185546875, -28.5263671875, -26.90087890625, -25.275390625, -23.64990234375, -22.0244140625, -20.39892578125, -18.7734375, -17.14794921875, -15.5224609375, -13.89697265625, -12.271484375, -10.64599609375, -9.0205078125, -7.39501953125, -5.76953125, -4.14404296875, -2.5185546875, -0.89306640625, 0.732421875, 2.35791015625, 3.9833984375, 5.60888671875, 7.234375, 8.85986328125, 10.4853515625, 12.11083984375, 13.736328125, 15.36181640625, 16.9873046875, 18.61279296875, 20.23828125, 21.86376953125, 23.4892578125, 25.11474609375, 26.740234375, 28.36572265625, 29.9912109375, 31.61669921875, 33.2421875, 34.86767578125, 36.4931640625, 38.11865234375, 39.744140625, 41.36962890625, 42.9951171875, 44.62060546875, 46.24609375, 47.87158203125, 49.4970703125, 51.12255859375, 52.748046875, 54.37353515625, 55.9990234375, 57.62451171875, 59.25]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 11.0, 33.0, 44.0, 100.0, 147.0, 256.0, 409.0, 626.0, 1168.0, 1943.0, 3359.0, 5957.0, 10396.0, 17840.0, 31373.0, 53585.0, 89492.0, 143184.0, 221088.0, 322262.0, 431006.0, 518071.0, 550668.0, 510450.0, 418899.0, 309558.0, 212385.0, 136791.0, 83564.0, 50257.0, 29121.0, 16935.0, 9979.0, 5594.0, 3229.0, 1856.0, 1100.0, 592.0, 392.0, 238.0, 120.0, 72.0, 44.0, 22.0, 13.0, 13.0, 8.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-63.75, -61.84375, -59.9375, -58.03125, -56.125, -54.21875, -52.3125, -50.40625, -48.5, -46.59375, -44.6875, -42.78125, -40.875, -38.96875, -37.0625, -35.15625, -33.25, -31.34375, -29.4375, -27.53125, -25.625, -23.71875, -21.8125, -19.90625, -18.0, -16.09375, -14.1875, -12.28125, -10.375, -8.46875, -6.5625, -4.65625, -2.75, -0.84375, 1.0625, 2.96875, 4.875, 6.78125, 8.6875, 10.59375, 12.5, 14.40625, 16.3125, 18.21875, 20.125, 22.03125, 23.9375, 25.84375, 27.75, 29.65625, 31.5625, 33.46875, 35.375, 37.28125, 39.1875, 41.09375, 43.0, 44.90625, 46.8125, 48.71875, 50.625, 52.53125, 54.4375, 56.34375, 58.25]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 10.0, 24.0, 27.0, 23.0, 42.0, 56.0, 82.0, 86.0, 119.0, 119.0, 140.0, 180.0, 174.0, 202.0, 220.0, 207.0, 214.0, 250.0, 230.0, 255.0, 214.0, 206.0, 167.0, 140.0, 129.0, 106.0, 94.0, 61.0, 64.0, 53.0, 41.0, 32.0, 21.0, 12.0, 19.0, 9.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.640625, -26.752197265625, -25.86376953125, -24.975341796875, -24.0869140625, -23.198486328125, -22.31005859375, -21.421630859375, -20.533203125, -19.644775390625, -18.75634765625, -17.867919921875, -16.9794921875, -16.091064453125, -15.20263671875, -14.314208984375, -13.42578125, -12.537353515625, -11.64892578125, -10.760498046875, -9.8720703125, -8.983642578125, -8.09521484375, -7.206787109375, -6.318359375, -5.429931640625, -4.54150390625, -3.653076171875, -2.7646484375, -1.876220703125, -0.98779296875, -0.099365234375, 0.7890625, 1.677490234375, 2.56591796875, 3.454345703125, 4.3427734375, 5.231201171875, 6.11962890625, 7.008056640625, 7.896484375, 8.784912109375, 9.67333984375, 10.561767578125, 11.4501953125, 12.338623046875, 13.22705078125, 14.115478515625, 15.00390625, 15.892333984375, 16.78076171875, 17.669189453125, 18.5576171875, 19.446044921875, 20.33447265625, 21.222900390625, 22.111328125, 22.999755859375, 23.88818359375, 24.776611328125, 25.6650390625, 26.553466796875, 27.44189453125, 28.330322265625, 29.21875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 6.0, 6.0, 13.0, 7.0, 8.0, 14.0, 9.0, 17.0, 25.0, 24.0, 29.0, 32.0, 38.0, 41.0, 44.0, 45.0, 47.0, 34.0, 47.0, 38.0, 34.0, 48.0, 40.0, 50.0, 34.0, 34.0, 38.0, 26.0, 24.0, 29.0, 19.0, 14.0, 18.0, 11.0, 9.0, 12.0, 5.0, 3.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-64.0414810180664, -62.051815032958984, -60.06214904785156, -58.072479248046875, -56.08281326293945, -54.09314727783203, -52.10348129272461, -50.11381530761719, -48.1241455078125, -46.13447952270508, -44.144813537597656, -42.15514373779297, -40.16547775268555, -38.175811767578125, -36.1861457824707, -34.19647979736328, -32.20681381225586, -30.217147827148438, -28.227479934692383, -26.23781394958496, -24.248146057128906, -22.258480072021484, -20.268814086914062, -18.27914810180664, -16.289480209350586, -14.299813270568848, -12.31014633178711, -10.320480346679688, -8.33081340789795, -6.341146469116211, -4.351480484008789, -2.361813545227051, -0.3721427917480469, 1.6175239086151123, 3.6071906089782715, 5.596857070922852, 7.58652400970459, 9.576190948486328, 11.56585693359375, 13.555523872375488, 15.545190811157227, 17.53485679626465, 19.524524688720703, 21.514190673828125, 23.503856658935547, 25.4935245513916, 27.483190536499023, 29.472858428955078, 31.4625244140625, 33.45219039916992, 35.441856384277344, 37.43152618408203, 39.42119216918945, 41.410858154296875, 43.4005241394043, 45.39019012451172, 47.379859924316406, 49.36952590942383, 51.35919189453125, 53.34886169433594, 55.33852767944336, 57.32819366455078, 59.3178596496582, 61.307525634765625, 63.29719161987305]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 9.0, 12.0, 17.0, 13.0, 13.0, 21.0, 21.0, 20.0, 30.0, 29.0, 30.0, 43.0, 33.0, 43.0, 34.0, 37.0, 35.0, 47.0, 42.0, 44.0, 56.0, 39.0, 28.0, 33.0, 35.0, 31.0, 32.0, 21.0, 18.0, 27.0, 17.0, 18.0, 12.0, 16.0, 8.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.1981086730957, -50.17898178100586, -48.159854888916016, -46.14072799682617, -44.12159729003906, -42.10247039794922, -40.083343505859375, -38.06421661376953, -36.04508972167969, -34.025962829589844, -32.0068359375, -29.987707138061523, -27.96858024597168, -25.949453353881836, -23.93032455444336, -21.911197662353516, -19.892070770263672, -17.872943878173828, -15.853816032409668, -13.834688186645508, -11.815561294555664, -9.79643440246582, -7.77730655670166, -5.7581787109375, -3.7390518188476562, -1.7199244499206543, 0.29920291900634766, 2.3183302879333496, 4.337457656860352, 6.356584548950195, 8.375712394714355, 10.394840240478516, 12.413963317871094, 14.433090209960938, 16.45221710205078, 18.471345901489258, 20.4904727935791, 22.509599685668945, 24.528728485107422, 26.547855377197266, 28.56698226928711, 30.586109161376953, 32.6052360534668, 34.62436294555664, 36.64349365234375, 38.662620544433594, 40.68174743652344, 42.70087432861328, 44.720001220703125, 46.73912811279297, 48.75825500488281, 50.777381896972656, 52.7965087890625, 54.815635681152344, 56.83476638793945, 58.8538932800293, 60.87302017211914, 62.892147064208984, 64.9112777709961, 66.93040466308594, 68.94953155517578, 70.96865844726562, 72.98778533935547, 75.00691223144531, 77.02603912353516]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 10.0, 18.0, 26.0, 32.0, 62.0, 99.0, 123.0, 190.0, 332.0, 512.0, 805.0, 1310.0, 1936.0, 2922.0, 4618.0, 6983.0, 10573.0, 15849.0, 23310.0, 33445.0, 46418.0, 61905.0, 77733.0, 92309.0, 101624.0, 104860.0, 100458.0, 89157.0, 74347.0, 58061.0, 43335.0, 31382.0, 21663.0, 14597.0, 9589.0, 6322.0, 4161.0, 2599.0, 1713.0, 1105.0, 701.0, 478.0, 330.0, 185.0, 125.0, 98.0, 55.0, 38.0, 19.0, 14.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-28.078125, -27.18359375, -26.2890625, -25.39453125, -24.5, -23.60546875, -22.7109375, -21.81640625, -20.921875, -20.02734375, -19.1328125, -18.23828125, -17.34375, -16.44921875, -15.5546875, -14.66015625, -13.765625, -12.87109375, -11.9765625, -11.08203125, -10.1875, -9.29296875, -8.3984375, -7.50390625, -6.609375, -5.71484375, -4.8203125, -3.92578125, -3.03125, -2.13671875, -1.2421875, -0.34765625, 0.546875, 1.44140625, 2.3359375, 3.23046875, 4.125, 5.01953125, 5.9140625, 6.80859375, 7.703125, 8.59765625, 9.4921875, 10.38671875, 11.28125, 12.17578125, 13.0703125, 13.96484375, 14.859375, 15.75390625, 16.6484375, 17.54296875, 18.4375, 19.33203125, 20.2265625, 21.12109375, 22.015625, 22.91015625, 23.8046875, 24.69921875, 25.59375, 26.48828125, 27.3828125, 28.27734375, 29.171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 15.0, 15.0, 22.0, 21.0, 18.0, 30.0, 31.0, 30.0, 43.0, 35.0, 39.0, 33.0, 41.0, 33.0, 43.0, 42.0, 47.0, 54.0, 41.0, 27.0, 31.0, 34.0, 32.0, 34.0, 23.0, 19.0, 23.0, 19.0, 14.0, 15.0, 14.0, 11.0, 7.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.75, -50.712890625, -48.67578125, -46.638671875, -44.6015625, -42.564453125, -40.52734375, -38.490234375, -36.453125, -34.416015625, -32.37890625, -30.341796875, -28.3046875, -26.267578125, -24.23046875, -22.193359375, -20.15625, -18.119140625, -16.08203125, -14.044921875, -12.0078125, -9.970703125, -7.93359375, -5.896484375, -3.859375, -1.822265625, 0.21484375, 2.251953125, 4.2890625, 6.326171875, 8.36328125, 10.400390625, 12.4375, 14.474609375, 16.51171875, 18.548828125, 20.5859375, 22.623046875, 24.66015625, 26.697265625, 28.734375, 30.771484375, 32.80859375, 34.845703125, 36.8828125, 38.919921875, 40.95703125, 42.994140625, 45.03125, 47.068359375, 49.10546875, 51.142578125, 53.1796875, 55.216796875, 57.25390625, 59.291015625, 61.328125, 63.365234375, 65.40234375, 67.439453125, 69.4765625, 71.513671875, 73.55078125, 75.587890625, 77.625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 13.0, 8.0, 11.0, 23.0, 42.0, 40.0, 66.0, 96.0, 123.0, 178.0, 230.0, 337.0, 462.0, 608.0, 912.0, 1204.0, 1691.0, 2282.0, 3206.0, 4328.0, 5954.0, 8307.0, 11384.0, 15689.0, 22526.0, 64395.0, 673006.0, 142752.0, 25810.0, 17002.0, 12508.0, 9026.0, 6700.0, 4899.0, 3575.0, 2543.0, 1775.0, 1353.0, 950.0, 754.0, 491.0, 381.0, 250.0, 199.0, 146.0, 99.0, 81.0, 47.0, 37.0, 15.0, 13.0, 12.0, 5.0, 4.0, 4.0, 2.0, 1.0, 5.0], "bins": [-47.9375, -46.46875, -45.0, -43.53125, -42.0625, -40.59375, -39.125, -37.65625, -36.1875, -34.71875, -33.25, -31.78125, -30.3125, -28.84375, -27.375, -25.90625, -24.4375, -22.96875, -21.5, -20.03125, -18.5625, -17.09375, -15.625, -14.15625, -12.6875, -11.21875, -9.75, -8.28125, -6.8125, -5.34375, -3.875, -2.40625, -0.9375, 0.53125, 2.0, 3.46875, 4.9375, 6.40625, 7.875, 9.34375, 10.8125, 12.28125, 13.75, 15.21875, 16.6875, 18.15625, 19.625, 21.09375, 22.5625, 24.03125, 25.5, 26.96875, 28.4375, 29.90625, 31.375, 32.84375, 34.3125, 35.78125, 37.25, 38.71875, 40.1875, 41.65625, 43.125, 44.59375, 46.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 3.0, 11.0, 7.0, 7.0, 18.0, 13.0, 20.0, 16.0, 16.0, 18.0, 31.0, 39.0, 37.0, 42.0, 43.0, 43.0, 49.0, 43.0, 63.0, 36.0, 46.0, 41.0, 48.0, 37.0, 27.0, 31.0, 38.0, 31.0, 24.0, 22.0, 17.0, 19.0, 18.0, 10.0, 9.0, 3.0, 6.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.78125, -42.1962890625, -40.611328125, -39.0263671875, -37.44140625, -35.8564453125, -34.271484375, -32.6865234375, -31.1015625, -29.5166015625, -27.931640625, -26.3466796875, -24.76171875, -23.1767578125, -21.591796875, -20.0068359375, -18.421875, -16.8369140625, -15.251953125, -13.6669921875, -12.08203125, -10.4970703125, -8.912109375, -7.3271484375, -5.7421875, -4.1572265625, -2.572265625, -0.9873046875, 0.59765625, 2.1826171875, 3.767578125, 5.3525390625, 6.9375, 8.5224609375, 10.107421875, 11.6923828125, 13.27734375, 14.8623046875, 16.447265625, 18.0322265625, 19.6171875, 21.2021484375, 22.787109375, 24.3720703125, 25.95703125, 27.5419921875, 29.126953125, 30.7119140625, 32.296875, 33.8818359375, 35.466796875, 37.0517578125, 38.63671875, 40.2216796875, 41.806640625, 43.3916015625, 44.9765625, 46.5615234375, 48.146484375, 49.7314453125, 51.31640625, 52.9013671875, 54.486328125, 56.0712890625, 57.65625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 20.0, 16.0, 22.0, 27.0, 45.0, 47.0, 65.0, 80.0, 110.0, 145.0, 194.0, 284.0, 369.0, 591.0, 705.0, 1040.0, 1513.0, 2240.0, 3047.0, 4776.0, 6969.0, 10614.0, 16690.0, 30278.0, 148299.0, 679154.0, 72873.0, 24596.0, 14626.0, 9452.0, 6087.0, 4114.0, 2833.0, 1871.0, 1361.0, 913.0, 658.0, 480.0, 338.0, 256.0, 193.0, 132.0, 124.0, 83.0, 52.0, 44.0, 31.0, 24.0, 12.0, 22.0, 5.0, 14.0, 6.0, 3.0, 4.0, 1.0, 3.0], "bins": [-4.98046875, -4.8265380859375, -4.672607421875, -4.5186767578125, -4.36474609375, -4.2108154296875, -4.056884765625, -3.9029541015625, -3.7490234375, -3.5950927734375, -3.441162109375, -3.2872314453125, -3.13330078125, -2.9793701171875, -2.825439453125, -2.6715087890625, -2.517578125, -2.3636474609375, -2.209716796875, -2.0557861328125, -1.90185546875, -1.7479248046875, -1.593994140625, -1.4400634765625, -1.2861328125, -1.1322021484375, -0.978271484375, -0.8243408203125, -0.67041015625, -0.5164794921875, -0.362548828125, -0.2086181640625, -0.0546875, 0.0992431640625, 0.253173828125, 0.4071044921875, 0.56103515625, 0.7149658203125, 0.868896484375, 1.0228271484375, 1.1767578125, 1.3306884765625, 1.484619140625, 1.6385498046875, 1.79248046875, 1.9464111328125, 2.100341796875, 2.2542724609375, 2.408203125, 2.5621337890625, 2.716064453125, 2.8699951171875, 3.02392578125, 3.1778564453125, 3.331787109375, 3.4857177734375, 3.6396484375, 3.7935791015625, 3.947509765625, 4.1014404296875, 4.25537109375, 4.4093017578125, 4.563232421875, 4.7171630859375, 4.87109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 6.0, 4.0, 9.0, 7.0, 12.0, 14.0, 7.0, 15.0, 16.0, 27.0, 29.0, 19.0, 29.0, 28.0, 38.0, 40.0, 42.0, 47.0, 44.0, 42.0, 43.0, 52.0, 46.0, 53.0, 41.0, 40.0, 41.0, 25.0, 26.0, 21.0, 24.0, 22.0, 17.0, 9.0, 11.0, 11.0, 4.0, 6.0, 10.0, 6.0, 1.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0011510848999023438, -0.0011145174503326416, -0.0010779500007629395, -0.0010413825511932373, -0.0010048151016235352, -0.000968247652053833, -0.0009316802024841309, -0.0008951127529144287, -0.0008585453033447266, -0.0008219778537750244, -0.0007854104042053223, -0.0007488429546356201, -0.000712275505065918, -0.0006757080554962158, -0.0006391406059265137, -0.0006025731563568115, -0.0005660057067871094, -0.0005294382572174072, -0.0004928708076477051, -0.00045630335807800293, -0.0004197359085083008, -0.00038316845893859863, -0.0003466010093688965, -0.00031003355979919434, -0.0002734661102294922, -0.00023689866065979004, -0.0002003312110900879, -0.00016376376152038574, -0.0001271963119506836, -9.062886238098145e-05, -5.40614128112793e-05, -1.749396324157715e-05, 1.9073486328125e-05, 5.564093589782715e-05, 9.22083854675293e-05, 0.00012877583503723145, 0.0001653432846069336, 0.00020191073417663574, 0.0002384781837463379, 0.00027504563331604004, 0.0003116130828857422, 0.00034818053245544434, 0.0003847479820251465, 0.00042131543159484863, 0.0004578828811645508, 0.0004944503307342529, 0.0005310177803039551, 0.0005675852298736572, 0.0006041526794433594, 0.0006407201290130615, 0.0006772875785827637, 0.0007138550281524658, 0.000750422477722168, 0.0007869899272918701, 0.0008235573768615723, 0.0008601248264312744, 0.0008966922760009766, 0.0009332597255706787, 0.0009698271751403809, 0.001006394624710083, 0.0010429620742797852, 0.0010795295238494873, 0.0011160969734191895, 0.0011526644229888916, 0.0011892318725585938]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 4.0, 9.0, 6.0, 12.0, 17.0, 31.0, 42.0, 61.0, 82.0, 158.0, 176.0, 338.0, 453.0, 696.0, 993.0, 1501.0, 2310.0, 3416.0, 5375.0, 8284.0, 12780.0, 19713.0, 30933.0, 46364.0, 68397.0, 93987.0, 119371.0, 134051.0, 129967.0, 111039.0, 83812.0, 59623.0, 40182.0, 26158.0, 16721.0, 10956.0, 7068.0, 4629.0, 2926.0, 1983.0, 1275.0, 918.0, 592.0, 380.0, 268.0, 178.0, 111.0, 65.0, 62.0, 35.0, 16.0, 15.0, 11.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0], "bins": [-2.68359375, -2.5992431640625, -2.514892578125, -2.4305419921875, -2.34619140625, -2.2618408203125, -2.177490234375, -2.0931396484375, -2.0087890625, -1.9244384765625, -1.840087890625, -1.7557373046875, -1.67138671875, -1.5870361328125, -1.502685546875, -1.4183349609375, -1.333984375, -1.2496337890625, -1.165283203125, -1.0809326171875, -0.99658203125, -0.9122314453125, -0.827880859375, -0.7435302734375, -0.6591796875, -0.5748291015625, -0.490478515625, -0.4061279296875, -0.32177734375, -0.2374267578125, -0.153076171875, -0.0687255859375, 0.015625, 0.0999755859375, 0.184326171875, 0.2686767578125, 0.35302734375, 0.4373779296875, 0.521728515625, 0.6060791015625, 0.6904296875, 0.7747802734375, 0.859130859375, 0.9434814453125, 1.02783203125, 1.1121826171875, 1.196533203125, 1.2808837890625, 1.365234375, 1.4495849609375, 1.533935546875, 1.6182861328125, 1.70263671875, 1.7869873046875, 1.871337890625, 1.9556884765625, 2.0400390625, 2.1243896484375, 2.208740234375, 2.2930908203125, 2.37744140625, 2.4617919921875, 2.546142578125, 2.6304931640625, 2.71484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 5.0, 2.0, 7.0, 3.0, 21.0, 13.0, 12.0, 23.0, 19.0, 30.0, 29.0, 36.0, 43.0, 41.0, 49.0, 43.0, 49.0, 56.0, 49.0, 54.0, 59.0, 44.0, 54.0, 42.0, 35.0, 38.0, 20.0, 14.0, 21.0, 15.0, 16.0, 5.0, 13.0, 11.0, 4.0, 10.0, 6.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.078125, -1.0448760986328125, -1.011627197265625, -0.9783782958984375, -0.94512939453125, -0.9118804931640625, -0.878631591796875, -0.8453826904296875, -0.8121337890625, -0.7788848876953125, -0.745635986328125, -0.7123870849609375, -0.67913818359375, -0.6458892822265625, -0.612640380859375, -0.5793914794921875, -0.546142578125, -0.5128936767578125, -0.479644775390625, -0.4463958740234375, -0.41314697265625, -0.3798980712890625, -0.346649169921875, -0.3134002685546875, -0.2801513671875, -0.2469024658203125, -0.213653564453125, -0.1804046630859375, -0.14715576171875, -0.1139068603515625, -0.080657958984375, -0.0474090576171875, -0.01416015625, 0.0190887451171875, 0.052337646484375, 0.0855865478515625, 0.11883544921875, 0.1520843505859375, 0.185333251953125, 0.2185821533203125, 0.2518310546875, 0.2850799560546875, 0.318328857421875, 0.3515777587890625, 0.38482666015625, 0.4180755615234375, 0.451324462890625, 0.4845733642578125, 0.517822265625, 0.5510711669921875, 0.584320068359375, 0.6175689697265625, 0.65081787109375, 0.6840667724609375, 0.717315673828125, 0.7505645751953125, 0.7838134765625, 0.8170623779296875, 0.850311279296875, 0.8835601806640625, 0.91680908203125, 0.9500579833984375, 0.983306884765625, 1.0165557861328125, 1.0498046875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 9.0, 7.0, 14.0, 13.0, 22.0, 16.0, 27.0, 34.0, 44.0, 25.0, 27.0, 46.0, 45.0, 53.0, 58.0, 55.0, 48.0, 45.0, 46.0, 37.0, 39.0, 51.0, 36.0, 39.0, 31.0, 18.0, 12.0, 24.0, 17.0, 13.0, 12.0, 2.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-76.9545669555664, -74.69002532958984, -72.42549133300781, -70.16094970703125, -67.89641571044922, -65.63187408447266, -63.36733627319336, -61.10279846191406, -58.838260650634766, -56.57372283935547, -54.30918502807617, -52.044647216796875, -49.78010559082031, -47.51557159423828, -45.25102996826172, -42.98649215698242, -40.721954345703125, -38.45741653442383, -36.19287872314453, -33.928340911865234, -31.663801193237305, -29.399263381958008, -27.134723663330078, -24.87018585205078, -22.605648040771484, -20.341110229492188, -18.07657241821289, -15.812032699584961, -13.547494888305664, -11.282957077026367, -9.018418312072754, -6.753879547119141, -4.4893341064453125, -2.2247958183288574, 0.039742469787597656, 2.3042807579040527, 4.568819046020508, 6.833356857299805, 9.097895622253418, 11.362434387207031, 13.626972198486328, 15.891510009765625, 18.156047821044922, 20.42058753967285, 22.68512535095215, 24.949663162231445, 27.214202880859375, 29.478740692138672, 31.74327850341797, 34.007816314697266, 36.27235412597656, 38.53689193725586, 40.801429748535156, 43.06597137451172, 45.330509185791016, 47.59504699707031, 49.85958480834961, 52.124122619628906, 54.3886604309082, 56.6531982421875, 58.91773986816406, 61.182273864746094, 63.446815490722656, 65.71134948730469, 67.97589111328125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 6.0, 7.0, 10.0, 11.0, 13.0, 20.0, 12.0, 27.0, 18.0, 29.0, 23.0, 34.0, 39.0, 39.0, 33.0, 43.0, 34.0, 31.0, 44.0, 45.0, 44.0, 53.0, 47.0, 34.0, 28.0, 35.0, 37.0, 27.0, 26.0, 22.0, 20.0, 25.0, 15.0, 14.0, 14.0, 9.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.366737365722656, -52.296630859375, -50.22652816772461, -48.15642166137695, -46.08631896972656, -44.016212463378906, -41.94610595703125, -39.875999450683594, -37.8058967590332, -35.73579025268555, -33.665687561035156, -31.5955810546875, -29.525476455688477, -27.455371856689453, -25.385265350341797, -23.315160751342773, -21.24505615234375, -19.174951553344727, -17.104846954345703, -15.034740447998047, -12.964635848999023, -10.89453125, -8.82442569732666, -6.75432014465332, -4.684215545654297, -2.6141104698181152, -0.5440053939819336, 1.526099681854248, 3.5962047576904297, 5.666309356689453, 7.736414909362793, 9.806520462036133, 11.876617431640625, 13.946722030639648, 16.016826629638672, 18.086933135986328, 20.15703773498535, 22.227142333984375, 24.29724884033203, 26.367353439331055, 28.437458038330078, 30.5075626373291, 32.577667236328125, 34.64777374267578, 36.71788024902344, 38.78798294067383, 40.858089447021484, 42.928192138671875, 44.99829864501953, 47.06840515136719, 49.13850784301758, 51.208614349365234, 53.278717041015625, 55.34882354736328, 57.41893005371094, 59.489036560058594, 61.559139251708984, 63.62924575805664, 65.69934844970703, 67.76945495605469, 69.83956146240234, 71.90966796875, 73.97976684570312, 76.04987335205078, 78.11997985839844]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 30.0, 54.0, 54.0, 92.0, 157.0, 224.0, 417.0, 633.0, 1040.0, 1811.0, 3028.0, 4995.0, 8713.0, 14132.0, 23245.0, 36536.0, 54820.0, 78354.0, 100563.0, 119748.0, 127566.0, 122210.0, 104890.0, 82340.0, 58774.0, 39752.0, 25528.0, 15418.0, 9606.0, 5499.0, 3240.0, 1958.0, 1195.0, 739.0, 464.0, 268.0, 164.0, 106.0, 66.0, 39.0, 21.0, 16.0, 12.0, 8.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.21875, -51.42041015625, -49.6220703125, -47.82373046875, -46.025390625, -44.22705078125, -42.4287109375, -40.63037109375, -38.83203125, -37.03369140625, -35.2353515625, -33.43701171875, -31.638671875, -29.84033203125, -28.0419921875, -26.24365234375, -24.4453125, -22.64697265625, -20.8486328125, -19.05029296875, -17.251953125, -15.45361328125, -13.6552734375, -11.85693359375, -10.05859375, -8.26025390625, -6.4619140625, -4.66357421875, -2.865234375, -1.06689453125, 0.7314453125, 2.52978515625, 4.328125, 6.12646484375, 7.9248046875, 9.72314453125, 11.521484375, 13.31982421875, 15.1181640625, 16.91650390625, 18.71484375, 20.51318359375, 22.3115234375, 24.10986328125, 25.908203125, 27.70654296875, 29.5048828125, 31.30322265625, 33.1015625, 34.89990234375, 36.6982421875, 38.49658203125, 40.294921875, 42.09326171875, 43.8916015625, 45.68994140625, 47.48828125, 49.28662109375, 51.0849609375, 52.88330078125, 54.681640625, 56.47998046875, 58.2783203125, 60.07666015625, 61.875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 6.0, 7.0, 10.0, 12.0, 17.0, 12.0, 20.0, 20.0, 28.0, 28.0, 24.0, 39.0, 40.0, 43.0, 37.0, 39.0, 42.0, 41.0, 45.0, 38.0, 53.0, 48.0, 42.0, 35.0, 26.0, 32.0, 42.0, 22.0, 19.0, 27.0, 23.0, 17.0, 14.0, 9.0, 17.0, 3.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.59375, -51.58349609375, -49.5732421875, -47.56298828125, -45.552734375, -43.54248046875, -41.5322265625, -39.52197265625, -37.51171875, -35.50146484375, -33.4912109375, -31.48095703125, -29.470703125, -27.46044921875, -25.4501953125, -23.43994140625, -21.4296875, -19.41943359375, -17.4091796875, -15.39892578125, -13.388671875, -11.37841796875, -9.3681640625, -7.35791015625, -5.34765625, -3.33740234375, -1.3271484375, 0.68310546875, 2.693359375, 4.70361328125, 6.7138671875, 8.72412109375, 10.734375, 12.74462890625, 14.7548828125, 16.76513671875, 18.775390625, 20.78564453125, 22.7958984375, 24.80615234375, 26.81640625, 28.82666015625, 30.8369140625, 32.84716796875, 34.857421875, 36.86767578125, 38.8779296875, 40.88818359375, 42.8984375, 44.90869140625, 46.9189453125, 48.92919921875, 50.939453125, 52.94970703125, 54.9599609375, 56.97021484375, 58.98046875, 60.99072265625, 63.0009765625, 65.01123046875, 67.021484375, 69.03173828125, 71.0419921875, 73.05224609375, 75.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 9.0, 20.0, 15.0, 28.0, 50.0, 58.0, 95.0, 175.0, 232.0, 394.0, 696.0, 1147.0, 1897.0, 3335.0, 5858.0, 10277.0, 17876.0, 30313.0, 49846.0, 76312.0, 106124.0, 132568.0, 144737.0, 136808.0, 112506.0, 82177.0, 54129.0, 33830.0, 19925.0, 11495.0, 6673.0, 3649.0, 2164.0, 1221.0, 720.0, 430.0, 254.0, 165.0, 137.0, 72.0, 46.0, 30.0, 15.0, 15.0, 11.0, 7.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 3.0], "bins": [-70.5625, -68.46240234375, -66.3623046875, -64.26220703125, -62.162109375, -60.06201171875, -57.9619140625, -55.86181640625, -53.76171875, -51.66162109375, -49.5615234375, -47.46142578125, -45.361328125, -43.26123046875, -41.1611328125, -39.06103515625, -36.9609375, -34.86083984375, -32.7607421875, -30.66064453125, -28.560546875, -26.46044921875, -24.3603515625, -22.26025390625, -20.16015625, -18.06005859375, -15.9599609375, -13.85986328125, -11.759765625, -9.65966796875, -7.5595703125, -5.45947265625, -3.359375, -1.25927734375, 0.8408203125, 2.94091796875, 5.041015625, 7.14111328125, 9.2412109375, 11.34130859375, 13.44140625, 15.54150390625, 17.6416015625, 19.74169921875, 21.841796875, 23.94189453125, 26.0419921875, 28.14208984375, 30.2421875, 32.34228515625, 34.4423828125, 36.54248046875, 38.642578125, 40.74267578125, 42.8427734375, 44.94287109375, 47.04296875, 49.14306640625, 51.2431640625, 53.34326171875, 55.443359375, 57.54345703125, 59.6435546875, 61.74365234375, 63.84375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 10.0, 16.0, 17.0, 15.0, 22.0, 17.0, 24.0, 33.0, 29.0, 29.0, 35.0, 25.0, 44.0, 52.0, 46.0, 48.0, 48.0, 63.0, 37.0, 40.0, 34.0, 33.0, 36.0, 37.0, 29.0, 17.0, 21.0, 25.0, 24.0, 11.0, 18.0, 8.0, 9.0, 5.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-44.625, -43.2900390625, -41.955078125, -40.6201171875, -39.28515625, -37.9501953125, -36.615234375, -35.2802734375, -33.9453125, -32.6103515625, -31.275390625, -29.9404296875, -28.60546875, -27.2705078125, -25.935546875, -24.6005859375, -23.265625, -21.9306640625, -20.595703125, -19.2607421875, -17.92578125, -16.5908203125, -15.255859375, -13.9208984375, -12.5859375, -11.2509765625, -9.916015625, -8.5810546875, -7.24609375, -5.9111328125, -4.576171875, -3.2412109375, -1.90625, -0.5712890625, 0.763671875, 2.0986328125, 3.43359375, 4.7685546875, 6.103515625, 7.4384765625, 8.7734375, 10.1083984375, 11.443359375, 12.7783203125, 14.11328125, 15.4482421875, 16.783203125, 18.1181640625, 19.453125, 20.7880859375, 22.123046875, 23.4580078125, 24.79296875, 26.1279296875, 27.462890625, 28.7978515625, 30.1328125, 31.4677734375, 32.802734375, 34.1376953125, 35.47265625, 36.8076171875, 38.142578125, 39.4775390625, 40.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 21.0, 21.0, 33.0, 69.0, 89.0, 150.0, 244.0, 399.0, 649.0, 997.0, 1658.0, 3078.0, 5311.0, 9758.0, 18873.0, 36113.0, 66712.0, 116137.0, 167339.0, 191749.0, 168234.0, 115608.0, 67664.0, 36050.0, 18911.0, 9883.0, 5299.0, 3039.0, 1727.0, 1047.0, 603.0, 379.0, 233.0, 164.0, 90.0, 75.0, 45.0, 26.0, 21.0, 21.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.578125, -24.711181640625, -23.84423828125, -22.977294921875, -22.1103515625, -21.243408203125, -20.37646484375, -19.509521484375, -18.642578125, -17.775634765625, -16.90869140625, -16.041748046875, -15.1748046875, -14.307861328125, -13.44091796875, -12.573974609375, -11.70703125, -10.840087890625, -9.97314453125, -9.106201171875, -8.2392578125, -7.372314453125, -6.50537109375, -5.638427734375, -4.771484375, -3.904541015625, -3.03759765625, -2.170654296875, -1.3037109375, -0.436767578125, 0.43017578125, 1.297119140625, 2.1640625, 3.031005859375, 3.89794921875, 4.764892578125, 5.6318359375, 6.498779296875, 7.36572265625, 8.232666015625, 9.099609375, 9.966552734375, 10.83349609375, 11.700439453125, 12.5673828125, 13.434326171875, 14.30126953125, 15.168212890625, 16.03515625, 16.902099609375, 17.76904296875, 18.635986328125, 19.5029296875, 20.369873046875, 21.23681640625, 22.103759765625, 22.970703125, 23.837646484375, 24.70458984375, 25.571533203125, 26.4384765625, 27.305419921875, 28.17236328125, 29.039306640625, 29.90625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 9.0, 5.0, 22.0, 17.0, 14.0, 22.0, 29.0, 27.0, 34.0, 34.0, 50.0, 35.0, 54.0, 51.0, 64.0, 55.0, 52.0, 50.0, 56.0, 43.0, 39.0, 33.0, 26.0, 24.0, 32.0, 21.0, 17.0, 12.0, 10.0, 8.0, 10.0, 6.0, 5.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0024166107177734375, -0.0023413002490997314, -0.0022659897804260254, -0.0021906793117523193, -0.0021153688430786133, -0.0020400583744049072, -0.001964747905731201, -0.0018894374370574951, -0.001814126968383789, -0.001738816499710083, -0.001663506031036377, -0.001588195562362671, -0.0015128850936889648, -0.0014375746250152588, -0.0013622641563415527, -0.0012869536876678467, -0.0012116432189941406, -0.0011363327503204346, -0.0010610222816467285, -0.0009857118129730225, -0.0009104013442993164, -0.0008350908756256104, -0.0007597804069519043, -0.0006844699382781982, -0.0006091594696044922, -0.0005338490009307861, -0.0004585385322570801, -0.000383228063583374, -0.00030791759490966797, -0.00023260712623596191, -0.00015729665756225586, -8.19861888885498e-05, -6.67572021484375e-06, 6.86347484588623e-05, 0.00014394521713256836, 0.00021925568580627441, 0.00029456615447998047, 0.0003698766231536865, 0.0004451870918273926, 0.0005204975605010986, 0.0005958080291748047, 0.0006711184978485107, 0.0007464289665222168, 0.0008217394351959229, 0.0008970499038696289, 0.000972360372543335, 0.001047670841217041, 0.001122981309890747, 0.0011982917785644531, 0.0012736022472381592, 0.0013489127159118652, 0.0014242231845855713, 0.0014995336532592773, 0.0015748441219329834, 0.0016501545906066895, 0.0017254650592803955, 0.0018007755279541016, 0.0018760859966278076, 0.0019513964653015137, 0.0020267069339752197, 0.0021020174026489258, 0.002177327871322632, 0.002252638339996338, 0.002327948808670044, 0.00240325927734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 9.0, 8.0, 13.0, 21.0, 33.0, 44.0, 88.0, 134.0, 213.0, 312.0, 465.0, 740.0, 1141.0, 1815.0, 2802.0, 4334.0, 6985.0, 10980.0, 17648.0, 27088.0, 41986.0, 61827.0, 85937.0, 110041.0, 127232.0, 129828.0, 117323.0, 95160.0, 69609.0, 47287.0, 31578.0, 20409.0, 12921.0, 8158.0, 5285.0, 3249.0, 2050.0, 1320.0, 874.0, 577.0, 377.0, 220.0, 138.0, 102.0, 70.0, 51.0, 24.0, 20.0, 14.0, 10.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.234375, -16.6435546875, -16.052734375, -15.4619140625, -14.87109375, -14.2802734375, -13.689453125, -13.0986328125, -12.5078125, -11.9169921875, -11.326171875, -10.7353515625, -10.14453125, -9.5537109375, -8.962890625, -8.3720703125, -7.78125, -7.1904296875, -6.599609375, -6.0087890625, -5.41796875, -4.8271484375, -4.236328125, -3.6455078125, -3.0546875, -2.4638671875, -1.873046875, -1.2822265625, -0.69140625, -0.1005859375, 0.490234375, 1.0810546875, 1.671875, 2.2626953125, 2.853515625, 3.4443359375, 4.03515625, 4.6259765625, 5.216796875, 5.8076171875, 6.3984375, 6.9892578125, 7.580078125, 8.1708984375, 8.76171875, 9.3525390625, 9.943359375, 10.5341796875, 11.125, 11.7158203125, 12.306640625, 12.8974609375, 13.48828125, 14.0791015625, 14.669921875, 15.2607421875, 15.8515625, 16.4423828125, 17.033203125, 17.6240234375, 18.21484375, 18.8056640625, 19.396484375, 19.9873046875, 20.578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 8.0, 8.0, 12.0, 10.0, 9.0, 14.0, 16.0, 23.0, 31.0, 26.0, 28.0, 47.0, 38.0, 36.0, 53.0, 57.0, 41.0, 45.0, 43.0, 47.0, 51.0, 41.0, 41.0, 39.0, 34.0, 39.0, 23.0, 24.0, 20.0, 15.0, 11.0, 12.0, 8.0, 6.0, 9.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.96875, -7.7108154296875, -7.452880859375, -7.1949462890625, -6.93701171875, -6.6790771484375, -6.421142578125, -6.1632080078125, -5.9052734375, -5.6473388671875, -5.389404296875, -5.1314697265625, -4.87353515625, -4.6156005859375, -4.357666015625, -4.0997314453125, -3.841796875, -3.5838623046875, -3.325927734375, -3.0679931640625, -2.81005859375, -2.5521240234375, -2.294189453125, -2.0362548828125, -1.7783203125, -1.5203857421875, -1.262451171875, -1.0045166015625, -0.74658203125, -0.4886474609375, -0.230712890625, 0.0272216796875, 0.28515625, 0.5430908203125, 0.801025390625, 1.0589599609375, 1.31689453125, 1.5748291015625, 1.832763671875, 2.0906982421875, 2.3486328125, 2.6065673828125, 2.864501953125, 3.1224365234375, 3.38037109375, 3.6383056640625, 3.896240234375, 4.1541748046875, 4.412109375, 4.6700439453125, 4.927978515625, 5.1859130859375, 5.44384765625, 5.7017822265625, 5.959716796875, 6.2176513671875, 6.4755859375, 6.7335205078125, 6.991455078125, 7.2493896484375, 7.50732421875, 7.7652587890625, 8.023193359375, 8.2811279296875, 8.5390625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 13.0, 6.0, 3.0, 7.0, 20.0, 25.0, 27.0, 26.0, 29.0, 51.0, 37.0, 53.0, 43.0, 51.0, 48.0, 46.0, 64.0, 52.0, 40.0, 43.0, 41.0, 43.0, 38.0, 30.0, 35.0, 21.0, 22.0, 18.0, 15.0, 8.0, 9.0, 9.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-80.9693832397461, -78.72274780273438, -76.47611999511719, -74.22948455810547, -71.98284912109375, -69.73622131347656, -67.48958587646484, -65.24295043945312, -62.99632263183594, -60.749691009521484, -58.503055572509766, -56.25642395019531, -54.00979232788086, -51.763160705566406, -49.51652526855469, -47.269893646240234, -45.023258209228516, -42.77662658691406, -40.529991149902344, -38.28335952758789, -36.03672790527344, -33.79009246826172, -31.543460845947266, -29.296829223632812, -27.050195693969727, -24.80356216430664, -22.556930541992188, -20.3102970123291, -18.063663482666016, -15.817031860351562, -13.570398330688477, -11.323765754699707, -9.077136993408203, -6.830504417419434, -4.583871364593506, -2.337238311767578, -0.0906057357788086, 2.156026840209961, 4.402660369873047, 6.649292945861816, 8.895925521850586, 11.142558097839355, 13.389190673828125, 15.635824203491211, 17.882457733154297, 20.12908935546875, 22.375722885131836, 24.622356414794922, 26.868988037109375, 29.11562156677246, 31.362253189086914, 33.60888671875, 35.85551834106445, 38.102149963378906, 40.348785400390625, 42.59541702270508, 44.84204864501953, 47.088680267333984, 49.3353157043457, 51.581947326660156, 53.82857894897461, 56.07521057128906, 58.32184600830078, 60.568477630615234, 62.81511306762695]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 0.0, 7.0, 5.0, 6.0, 11.0, 10.0, 14.0, 14.0, 19.0, 20.0, 16.0, 24.0, 19.0, 29.0, 25.0, 28.0, 41.0, 28.0, 32.0, 34.0, 38.0, 34.0, 35.0, 50.0, 42.0, 32.0, 40.0, 52.0, 38.0, 32.0, 20.0, 30.0, 22.0, 21.0, 20.0, 17.0, 11.0, 20.0, 7.0, 14.0, 8.0, 6.0, 9.0, 14.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.210289001464844, -47.3166389465332, -45.42298889160156, -43.52933883666992, -41.63568878173828, -39.74203872680664, -37.848388671875, -35.95473861694336, -34.06108856201172, -32.16743850708008, -30.273788452148438, -28.380138397216797, -26.486488342285156, -24.592838287353516, -22.699188232421875, -20.805538177490234, -18.911888122558594, -17.018238067626953, -15.124588012695312, -13.230937957763672, -11.337287902832031, -9.44363784790039, -7.54998779296875, -5.656337738037109, -3.7626876831054688, -1.8690376281738281, 0.0246124267578125, 1.9182624816894531, 3.8119125366210938, 5.705562591552734, 7.599212646484375, 9.492862701416016, 11.386512756347656, 13.280162811279297, 15.173812866210938, 17.067462921142578, 18.96111297607422, 20.85476303100586, 22.7484130859375, 24.64206314086914, 26.53571319580078, 28.429363250732422, 30.323013305664062, 32.2166633605957, 34.110313415527344, 36.003963470458984, 37.897613525390625, 39.791263580322266, 41.684913635253906, 43.57856369018555, 45.47221374511719, 47.36586380004883, 49.25951385498047, 51.15316390991211, 53.04681396484375, 54.94046401977539, 56.83411407470703, 58.72776412963867, 60.62141418457031, 62.51506423950195, 64.4087142944336, 66.3023681640625, 68.19601440429688, 70.08966064453125, 71.98331451416016]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 8.0, 14.0, 37.0, 78.0, 105.0, 185.0, 367.0, 622.0, 1072.0, 1786.0, 3272.0, 5462.0, 9482.0, 16255.0, 27320.0, 46254.0, 76401.0, 123816.0, 192599.0, 287775.0, 396848.0, 494906.0, 548059.0, 528717.0, 449178.0, 342064.0, 238779.0, 156122.0, 97683.0, 60333.0, 36029.0, 21283.0, 12538.0, 7570.0, 4350.0, 2751.0, 1596.0, 989.0, 585.0, 392.0, 231.0, 124.0, 77.0, 65.0, 42.0, 21.0, 13.0, 13.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-49.21875, -47.56494140625, -45.9111328125, -44.25732421875, -42.603515625, -40.94970703125, -39.2958984375, -37.64208984375, -35.98828125, -34.33447265625, -32.6806640625, -31.02685546875, -29.373046875, -27.71923828125, -26.0654296875, -24.41162109375, -22.7578125, -21.10400390625, -19.4501953125, -17.79638671875, -16.142578125, -14.48876953125, -12.8349609375, -11.18115234375, -9.52734375, -7.87353515625, -6.2197265625, -4.56591796875, -2.912109375, -1.25830078125, 0.3955078125, 2.04931640625, 3.703125, 5.35693359375, 7.0107421875, 8.66455078125, 10.318359375, 11.97216796875, 13.6259765625, 15.27978515625, 16.93359375, 18.58740234375, 20.2412109375, 21.89501953125, 23.548828125, 25.20263671875, 26.8564453125, 28.51025390625, 30.1640625, 31.81787109375, 33.4716796875, 35.12548828125, 36.779296875, 38.43310546875, 40.0869140625, 41.74072265625, 43.39453125, 45.04833984375, 46.7021484375, 48.35595703125, 50.009765625, 51.66357421875, 53.3173828125, 54.97119140625, 56.625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 2.0, 9.0, 12.0, 18.0, 12.0, 15.0, 18.0, 26.0, 22.0, 19.0, 28.0, 32.0, 31.0, 33.0, 34.0, 41.0, 39.0, 37.0, 34.0, 50.0, 42.0, 40.0, 33.0, 58.0, 36.0, 32.0, 37.0, 24.0, 25.0, 27.0, 15.0, 16.0, 16.0, 14.0, 16.0, 11.0, 4.0, 11.0, 8.0, 9.0, 7.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0, -45.2353515625, -43.470703125, -41.7060546875, -39.94140625, -38.1767578125, -36.412109375, -34.6474609375, -32.8828125, -31.1181640625, -29.353515625, -27.5888671875, -25.82421875, -24.0595703125, -22.294921875, -20.5302734375, -18.765625, -17.0009765625, -15.236328125, -13.4716796875, -11.70703125, -9.9423828125, -8.177734375, -6.4130859375, -4.6484375, -2.8837890625, -1.119140625, 0.6455078125, 2.41015625, 4.1748046875, 5.939453125, 7.7041015625, 9.46875, 11.2333984375, 12.998046875, 14.7626953125, 16.52734375, 18.2919921875, 20.056640625, 21.8212890625, 23.5859375, 25.3505859375, 27.115234375, 28.8798828125, 30.64453125, 32.4091796875, 34.173828125, 35.9384765625, 37.703125, 39.4677734375, 41.232421875, 42.9970703125, 44.76171875, 46.5263671875, 48.291015625, 50.0556640625, 51.8203125, 53.5849609375, 55.349609375, 57.1142578125, 58.87890625, 60.6435546875, 62.408203125, 64.1728515625, 65.9375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 18.0, 20.0, 38.0, 61.0, 70.0, 127.0, 217.0, 347.0, 554.0, 850.0, 1461.0, 2496.0, 4118.0, 6591.0, 10900.0, 17607.0, 28185.0, 45196.0, 70206.0, 106360.0, 158942.0, 222483.0, 298108.0, 376806.0, 437719.0, 467376.0, 452248.0, 398707.0, 324433.0, 246083.0, 176631.0, 121236.0, 80127.0, 51918.0, 33282.0, 20410.0, 12422.0, 7885.0, 4689.0, 2832.0, 1783.0, 1063.0, 658.0, 394.0, 230.0, 159.0, 94.0, 50.0, 29.0, 26.0, 14.0, 11.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.625, -49.02587890625, -47.4267578125, -45.82763671875, -44.228515625, -42.62939453125, -41.0302734375, -39.43115234375, -37.83203125, -36.23291015625, -34.6337890625, -33.03466796875, -31.435546875, -29.83642578125, -28.2373046875, -26.63818359375, -25.0390625, -23.43994140625, -21.8408203125, -20.24169921875, -18.642578125, -17.04345703125, -15.4443359375, -13.84521484375, -12.24609375, -10.64697265625, -9.0478515625, -7.44873046875, -5.849609375, -4.25048828125, -2.6513671875, -1.05224609375, 0.546875, 2.14599609375, 3.7451171875, 5.34423828125, 6.943359375, 8.54248046875, 10.1416015625, 11.74072265625, 13.33984375, 14.93896484375, 16.5380859375, 18.13720703125, 19.736328125, 21.33544921875, 22.9345703125, 24.53369140625, 26.1328125, 27.73193359375, 29.3310546875, 30.93017578125, 32.529296875, 34.12841796875, 35.7275390625, 37.32666015625, 38.92578125, 40.52490234375, 42.1240234375, 43.72314453125, 45.322265625, 46.92138671875, 48.5205078125, 50.11962890625, 51.71875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4.0, 12.0, 20.0, 21.0, 23.0, 23.0, 43.0, 38.0, 53.0, 57.0, 57.0, 84.0, 103.0, 105.0, 154.0, 161.0, 150.0, 206.0, 198.0, 199.0, 214.0, 258.0, 215.0, 197.0, 197.0, 190.0, 143.0, 144.0, 143.0, 114.0, 108.0, 83.0, 76.0, 55.0, 43.0, 41.0, 38.0, 27.0, 18.0, 16.0, 7.0, 13.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0], "bins": [-27.703125, -26.891357421875, -26.07958984375, -25.267822265625, -24.4560546875, -23.644287109375, -22.83251953125, -22.020751953125, -21.208984375, -20.397216796875, -19.58544921875, -18.773681640625, -17.9619140625, -17.150146484375, -16.33837890625, -15.526611328125, -14.71484375, -13.903076171875, -13.09130859375, -12.279541015625, -11.4677734375, -10.656005859375, -9.84423828125, -9.032470703125, -8.220703125, -7.408935546875, -6.59716796875, -5.785400390625, -4.9736328125, -4.161865234375, -3.35009765625, -2.538330078125, -1.7265625, -0.914794921875, -0.10302734375, 0.708740234375, 1.5205078125, 2.332275390625, 3.14404296875, 3.955810546875, 4.767578125, 5.579345703125, 6.39111328125, 7.202880859375, 8.0146484375, 8.826416015625, 9.63818359375, 10.449951171875, 11.26171875, 12.073486328125, 12.88525390625, 13.697021484375, 14.5087890625, 15.320556640625, 16.13232421875, 16.944091796875, 17.755859375, 18.567626953125, 19.37939453125, 20.191162109375, 21.0029296875, 21.814697265625, 22.62646484375, 23.438232421875, 24.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 9.0, 13.0, 9.0, 11.0, 19.0, 14.0, 15.0, 13.0, 30.0, 26.0, 25.0, 28.0, 22.0, 35.0, 43.0, 53.0, 29.0, 38.0, 38.0, 41.0, 26.0, 43.0, 24.0, 32.0, 35.0, 33.0, 22.0, 26.0, 26.0, 25.0, 32.0, 18.0, 19.0, 20.0, 19.0, 12.0, 16.0, 14.0, 10.0, 3.0, 8.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-59.39789962768555, -57.643192291259766, -55.888484954833984, -54.1337776184082, -52.37907028198242, -50.62436294555664, -48.869659423828125, -47.114952087402344, -45.36024475097656, -43.60553741455078, -41.850830078125, -40.09612274169922, -38.34141540527344, -36.586708068847656, -34.832000732421875, -33.077293395996094, -31.322586059570312, -29.56787872314453, -27.81317138671875, -26.05846405029297, -24.303756713867188, -22.549049377441406, -20.794343948364258, -19.039636611938477, -17.284929275512695, -15.530221939086914, -13.775514602661133, -12.020808219909668, -10.266100883483887, -8.511393547058105, -6.756687164306641, -5.001979827880859, -3.2472763061523438, -1.4925692081451416, 0.26213788986206055, 2.0168447494506836, 3.771552085876465, 5.526259422302246, 7.280965805053711, 9.035673141479492, 10.790380477905273, 12.545087814331055, 14.299795150756836, 16.054500579833984, 17.809207916259766, 19.563915252685547, 21.318622589111328, 23.07332992553711, 24.82803726196289, 26.582744598388672, 28.337451934814453, 30.092159271240234, 31.846866607666016, 33.6015739440918, 35.35627746582031, 37.110984802246094, 38.865692138671875, 40.620399475097656, 42.37510681152344, 44.12981414794922, 45.884521484375, 47.63922882080078, 49.39393615722656, 51.148643493652344, 52.903350830078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 7.0, 3.0, 8.0, 5.0, 12.0, 9.0, 9.0, 16.0, 15.0, 22.0, 14.0, 24.0, 24.0, 30.0, 27.0, 35.0, 46.0, 46.0, 34.0, 31.0, 33.0, 41.0, 52.0, 33.0, 43.0, 44.0, 38.0, 25.0, 29.0, 34.0, 32.0, 27.0, 21.0, 17.0, 14.0, 17.0, 21.0, 8.0, 8.0, 12.0, 4.0, 12.0, 4.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.15023422241211, -52.22712326049805, -50.30400848388672, -48.380897521972656, -46.457786560058594, -44.53467559814453, -42.61156463623047, -40.68844985961914, -38.76533889770508, -36.842227935791016, -34.91911315917969, -32.996002197265625, -31.072891235351562, -29.1497802734375, -27.226667404174805, -25.30355453491211, -23.380443572998047, -21.457332611083984, -19.53421974182129, -17.611106872558594, -15.687995910644531, -13.764883995056152, -11.841772079467773, -9.918660163879395, -7.995548248291016, -6.072436332702637, -4.149324417114258, -2.226212501525879, -0.3031005859375, 1.620011329650879, 3.543123245239258, 5.466235160827637, 7.389350891113281, 9.31246280670166, 11.235574722290039, 13.158686637878418, 15.081798553466797, 17.00490951538086, 18.928022384643555, 20.85113525390625, 22.774246215820312, 24.697357177734375, 26.62047004699707, 28.543582916259766, 30.466693878173828, 32.38980484008789, 34.31291961669922, 36.23603057861328, 38.159141540527344, 40.082252502441406, 42.00536346435547, 43.9284782409668, 45.85158920288086, 47.77470016479492, 49.69781494140625, 51.62092590332031, 53.544036865234375, 55.46714782714844, 57.3902587890625, 59.31337356567383, 61.23648452758789, 63.15959548950195, 65.08271026611328, 67.00582122802734, 68.9289321899414]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 13.0, 14.0, 33.0, 43.0, 96.0, 114.0, 161.0, 321.0, 391.0, 664.0, 1039.0, 1594.0, 2375.0, 3608.0, 5380.0, 8190.0, 12297.0, 17823.0, 25515.0, 36011.0, 47812.0, 62428.0, 77262.0, 89817.0, 97215.0, 99835.0, 95552.0, 85812.0, 72442.0, 57470.0, 43955.0, 32337.0, 22960.0, 15866.0, 10802.0, 7350.0, 4857.0, 3199.0, 2036.0, 1370.0, 865.0, 593.0, 372.0, 228.0, 152.0, 105.0, 62.0, 47.0, 28.0, 15.0, 12.0, 4.0, 9.0, 2.0, 0.0, 1.0, 2.0], "bins": [-25.859375, -25.059814453125, -24.26025390625, -23.460693359375, -22.6611328125, -21.861572265625, -21.06201171875, -20.262451171875, -19.462890625, -18.663330078125, -17.86376953125, -17.064208984375, -16.2646484375, -15.465087890625, -14.66552734375, -13.865966796875, -13.06640625, -12.266845703125, -11.46728515625, -10.667724609375, -9.8681640625, -9.068603515625, -8.26904296875, -7.469482421875, -6.669921875, -5.870361328125, -5.07080078125, -4.271240234375, -3.4716796875, -2.672119140625, -1.87255859375, -1.072998046875, -0.2734375, 0.526123046875, 1.32568359375, 2.125244140625, 2.9248046875, 3.724365234375, 4.52392578125, 5.323486328125, 6.123046875, 6.922607421875, 7.72216796875, 8.521728515625, 9.3212890625, 10.120849609375, 10.92041015625, 11.719970703125, 12.51953125, 13.319091796875, 14.11865234375, 14.918212890625, 15.7177734375, 16.517333984375, 17.31689453125, 18.116455078125, 18.916015625, 19.715576171875, 20.51513671875, 21.314697265625, 22.1142578125, 22.913818359375, 23.71337890625, 24.512939453125, 25.3125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 7.0, 5.0, 5.0, 5.0, 12.0, 11.0, 11.0, 16.0, 14.0, 20.0, 19.0, 24.0, 19.0, 34.0, 28.0, 39.0, 44.0, 42.0, 34.0, 29.0, 35.0, 43.0, 54.0, 30.0, 44.0, 43.0, 34.0, 24.0, 34.0, 30.0, 37.0, 26.0, 17.0, 15.0, 16.0, 18.0, 17.0, 9.0, 10.0, 9.0, 5.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.53125, -52.58544921875, -50.6396484375, -48.69384765625, -46.748046875, -44.80224609375, -42.8564453125, -40.91064453125, -38.96484375, -37.01904296875, -35.0732421875, -33.12744140625, -31.181640625, -29.23583984375, -27.2900390625, -25.34423828125, -23.3984375, -21.45263671875, -19.5068359375, -17.56103515625, -15.615234375, -13.66943359375, -11.7236328125, -9.77783203125, -7.83203125, -5.88623046875, -3.9404296875, -1.99462890625, -0.048828125, 1.89697265625, 3.8427734375, 5.78857421875, 7.734375, 9.68017578125, 11.6259765625, 13.57177734375, 15.517578125, 17.46337890625, 19.4091796875, 21.35498046875, 23.30078125, 25.24658203125, 27.1923828125, 29.13818359375, 31.083984375, 33.02978515625, 34.9755859375, 36.92138671875, 38.8671875, 40.81298828125, 42.7587890625, 44.70458984375, 46.650390625, 48.59619140625, 50.5419921875, 52.48779296875, 54.43359375, 56.37939453125, 58.3251953125, 60.27099609375, 62.216796875, 64.16259765625, 66.1083984375, 68.05419921875, 70.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 14.0, 25.0, 28.0, 59.0, 104.0, 153.0, 255.0, 385.0, 690.0, 1088.0, 1680.0, 2699.0, 4448.0, 7208.0, 11488.0, 18255.0, 30632.0, 290415.0, 589939.0, 35324.0, 20022.0, 12766.0, 7962.0, 4826.0, 3078.0, 1957.0, 1142.0, 705.0, 476.0, 281.0, 173.0, 102.0, 68.0, 34.0, 32.0, 7.0, 10.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-65.5, -63.4599609375, -61.419921875, -59.3798828125, -57.33984375, -55.2998046875, -53.259765625, -51.2197265625, -49.1796875, -47.1396484375, -45.099609375, -43.0595703125, -41.01953125, -38.9794921875, -36.939453125, -34.8994140625, -32.859375, -30.8193359375, -28.779296875, -26.7392578125, -24.69921875, -22.6591796875, -20.619140625, -18.5791015625, -16.5390625, -14.4990234375, -12.458984375, -10.4189453125, -8.37890625, -6.3388671875, -4.298828125, -2.2587890625, -0.21875, 1.8212890625, 3.861328125, 5.9013671875, 7.94140625, 9.9814453125, 12.021484375, 14.0615234375, 16.1015625, 18.1416015625, 20.181640625, 22.2216796875, 24.26171875, 26.3017578125, 28.341796875, 30.3818359375, 32.421875, 34.4619140625, 36.501953125, 38.5419921875, 40.58203125, 42.6220703125, 44.662109375, 46.7021484375, 48.7421875, 50.7822265625, 52.822265625, 54.8623046875, 56.90234375, 58.9423828125, 60.982421875, 63.0224609375, 65.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 9.0, 8.0, 11.0, 13.0, 26.0, 22.0, 19.0, 23.0, 21.0, 19.0, 33.0, 30.0, 29.0, 25.0, 36.0, 40.0, 27.0, 19.0, 37.0, 43.0, 35.0, 44.0, 39.0, 39.0, 49.0, 33.0, 33.0, 32.0, 26.0, 18.0, 15.0, 29.0, 20.0, 16.0, 18.0, 7.0, 12.0, 7.0, 6.0, 6.0, 3.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.65625, -43.236328125, -41.81640625, -40.396484375, -38.9765625, -37.556640625, -36.13671875, -34.716796875, -33.296875, -31.876953125, -30.45703125, -29.037109375, -27.6171875, -26.197265625, -24.77734375, -23.357421875, -21.9375, -20.517578125, -19.09765625, -17.677734375, -16.2578125, -14.837890625, -13.41796875, -11.998046875, -10.578125, -9.158203125, -7.73828125, -6.318359375, -4.8984375, -3.478515625, -2.05859375, -0.638671875, 0.78125, 2.201171875, 3.62109375, 5.041015625, 6.4609375, 7.880859375, 9.30078125, 10.720703125, 12.140625, 13.560546875, 14.98046875, 16.400390625, 17.8203125, 19.240234375, 20.66015625, 22.080078125, 23.5, 24.919921875, 26.33984375, 27.759765625, 29.1796875, 30.599609375, 32.01953125, 33.439453125, 34.859375, 36.279296875, 37.69921875, 39.119140625, 40.5390625, 41.958984375, 43.37890625, 44.798828125, 46.21875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 11.0, 17.0, 16.0, 20.0, 34.0, 30.0, 55.0, 73.0, 93.0, 128.0, 201.0, 288.0, 414.0, 567.0, 832.0, 1202.0, 1978.0, 2967.0, 4580.0, 7203.0, 12228.0, 21373.0, 49879.0, 712994.0, 161159.0, 28935.0, 15589.0, 9273.0, 5800.0, 3625.0, 2216.0, 1541.0, 1018.0, 695.0, 436.0, 308.0, 208.0, 150.0, 138.0, 78.0, 55.0, 46.0, 27.0, 21.0, 12.0, 11.0, 12.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.15234375, -4.0126953125, -3.873046875, -3.7333984375, -3.59375, -3.4541015625, -3.314453125, -3.1748046875, -3.03515625, -2.8955078125, -2.755859375, -2.6162109375, -2.4765625, -2.3369140625, -2.197265625, -2.0576171875, -1.91796875, -1.7783203125, -1.638671875, -1.4990234375, -1.359375, -1.2197265625, -1.080078125, -0.9404296875, -0.80078125, -0.6611328125, -0.521484375, -0.3818359375, -0.2421875, -0.1025390625, 0.037109375, 0.1767578125, 0.31640625, 0.4560546875, 0.595703125, 0.7353515625, 0.875, 1.0146484375, 1.154296875, 1.2939453125, 1.43359375, 1.5732421875, 1.712890625, 1.8525390625, 1.9921875, 2.1318359375, 2.271484375, 2.4111328125, 2.55078125, 2.6904296875, 2.830078125, 2.9697265625, 3.109375, 3.2490234375, 3.388671875, 3.5283203125, 3.66796875, 3.8076171875, 3.947265625, 4.0869140625, 4.2265625, 4.3662109375, 4.505859375, 4.6455078125, 4.78515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 5.0, 8.0, 13.0, 12.0, 11.0, 15.0, 14.0, 31.0, 29.0, 27.0, 37.0, 40.0, 30.0, 56.0, 51.0, 72.0, 52.0, 56.0, 54.0, 43.0, 42.0, 50.0, 34.0, 33.0, 35.0, 29.0, 22.0, 21.0, 17.0, 14.0, 12.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007371902465820312, -0.0007062405347824097, -0.0006752908229827881, -0.0006443411111831665, -0.0006133913993835449, -0.0005824416875839233, -0.0005514919757843018, -0.0005205422639846802, -0.0004895925521850586, -0.000458642840385437, -0.00042769312858581543, -0.00039674341678619385, -0.00036579370498657227, -0.0003348439931869507, -0.0003038942813873291, -0.0002729445695877075, -0.00024199485778808594, -0.00021104514598846436, -0.00018009543418884277, -0.0001491457223892212, -0.00011819601058959961, -8.724629878997803e-05, -5.6296586990356445e-05, -2.5346875190734863e-05, 5.602836608886719e-06, 3.65525484085083e-05, 6.750226020812988e-05, 9.845197200775146e-05, 0.00012940168380737305, 0.00016035139560699463, 0.0001913011074066162, 0.0002222508192062378, 0.0002532005310058594, 0.00028415024280548096, 0.00031509995460510254, 0.0003460496664047241, 0.0003769993782043457, 0.0004079490900039673, 0.00043889880180358887, 0.00046984851360321045, 0.000500798225402832, 0.0005317479372024536, 0.0005626976490020752, 0.0005936473608016968, 0.0006245970726013184, 0.0006555467844009399, 0.0006864964962005615, 0.0007174462080001831, 0.0007483959197998047, 0.0007793456315994263, 0.0008102953433990479, 0.0008412450551986694, 0.000872194766998291, 0.0009031444787979126, 0.0009340941905975342, 0.0009650439023971558, 0.0009959936141967773, 0.001026943325996399, 0.0010578930377960205, 0.001088842749595642, 0.0011197924613952637, 0.0011507421731948853, 0.0011816918849945068, 0.0012126415967941284, 0.00124359130859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 11.0, 18.0, 36.0, 47.0, 44.0, 72.0, 129.0, 169.0, 329.0, 462.0, 918.0, 1639.0, 2957.0, 5474.0, 9860.0, 18464.0, 33899.0, 60495.0, 99951.0, 144459.0, 173684.0, 167542.0, 130692.0, 84932.0, 50667.0, 27940.0, 15214.0, 8239.0, 4471.0, 2399.0, 1373.0, 727.0, 415.0, 285.0, 172.0, 115.0, 80.0, 59.0, 30.0, 19.0, 19.0, 6.0, 11.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.1640625, -3.070556640625, -2.97705078125, -2.883544921875, -2.7900390625, -2.696533203125, -2.60302734375, -2.509521484375, -2.416015625, -2.322509765625, -2.22900390625, -2.135498046875, -2.0419921875, -1.948486328125, -1.85498046875, -1.761474609375, -1.66796875, -1.574462890625, -1.48095703125, -1.387451171875, -1.2939453125, -1.200439453125, -1.10693359375, -1.013427734375, -0.919921875, -0.826416015625, -0.73291015625, -0.639404296875, -0.5458984375, -0.452392578125, -0.35888671875, -0.265380859375, -0.171875, -0.078369140625, 0.01513671875, 0.108642578125, 0.2021484375, 0.295654296875, 0.38916015625, 0.482666015625, 0.576171875, 0.669677734375, 0.76318359375, 0.856689453125, 0.9501953125, 1.043701171875, 1.13720703125, 1.230712890625, 1.32421875, 1.417724609375, 1.51123046875, 1.604736328125, 1.6982421875, 1.791748046875, 1.88525390625, 1.978759765625, 2.072265625, 2.165771484375, 2.25927734375, 2.352783203125, 2.4462890625, 2.539794921875, 2.63330078125, 2.726806640625, 2.8203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 11.0, 14.0, 13.0, 13.0, 27.0, 13.0, 30.0, 27.0, 18.0, 29.0, 37.0, 24.0, 39.0, 31.0, 33.0, 37.0, 40.0, 48.0, 44.0, 45.0, 45.0, 44.0, 31.0, 22.0, 43.0, 32.0, 22.0, 28.0, 24.0, 9.0, 16.0, 13.0, 11.0, 14.0, 20.0, 5.0, 4.0, 8.0, 8.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.88916015625, -0.8568801879882812, -0.8246002197265625, -0.7923202514648438, -0.760040283203125, -0.7277603149414062, -0.6954803466796875, -0.6632003784179688, -0.63092041015625, -0.5986404418945312, -0.5663604736328125, -0.5340805053710938, -0.501800537109375, -0.46952056884765625, -0.4372406005859375, -0.40496063232421875, -0.3726806640625, -0.34040069580078125, -0.3081207275390625, -0.27584075927734375, -0.243560791015625, -0.21128082275390625, -0.1790008544921875, -0.14672088623046875, -0.11444091796875, -0.08216094970703125, -0.0498809814453125, -0.01760101318359375, 0.014678955078125, 0.04695892333984375, 0.0792388916015625, 0.11151885986328125, 0.143798828125, 0.17607879638671875, 0.2083587646484375, 0.24063873291015625, 0.272918701171875, 0.30519866943359375, 0.3374786376953125, 0.36975860595703125, 0.40203857421875, 0.43431854248046875, 0.4665985107421875, 0.49887847900390625, 0.531158447265625, 0.5634384155273438, 0.5957183837890625, 0.6279983520507812, 0.6602783203125, 0.6925582885742188, 0.7248382568359375, 0.7571182250976562, 0.789398193359375, 0.8216781616210938, 0.8539581298828125, 0.8862380981445312, 0.91851806640625, 0.9507980346679688, 0.9830780029296875, 1.0153579711914062, 1.047637939453125, 1.0799179077148438, 1.1121978759765625, 1.1444778442382812, 1.1767578125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 3.0, 4.0, 5.0, 14.0, 12.0, 5.0, 14.0, 16.0, 22.0, 16.0, 13.0, 29.0, 25.0, 29.0, 24.0, 32.0, 30.0, 40.0, 45.0, 36.0, 35.0, 31.0, 54.0, 45.0, 37.0, 25.0, 17.0, 34.0, 29.0, 27.0, 34.0, 23.0, 24.0, 23.0, 29.0, 15.0, 18.0, 12.0, 15.0, 10.0, 7.0, 15.0, 7.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-61.922672271728516, -60.123634338378906, -58.32460021972656, -56.52556228637695, -54.726524353027344, -52.927486419677734, -51.128448486328125, -49.32941436767578, -47.53037643432617, -45.73133850097656, -43.93230438232422, -42.13326644897461, -40.334228515625, -38.53519058227539, -36.73615264892578, -34.93711853027344, -33.13808059692383, -31.33904266357422, -29.540006637573242, -27.740970611572266, -25.941932678222656, -24.142894744873047, -22.34385871887207, -20.544822692871094, -18.745784759521484, -16.946746826171875, -15.147710800170898, -13.348673820495605, -11.549636840820312, -9.75059986114502, -7.951562881469727, -6.152525901794434, -4.353485107421875, -2.554448127746582, -0.7554111480712891, 1.043625831604004, 2.842662811279297, 4.64169979095459, 6.440736770629883, 8.239773750305176, 10.038810729980469, 11.837847709655762, 13.636884689331055, 15.435921669006348, 17.23495864868164, 19.03399658203125, 20.833032608032227, 22.632068634033203, 24.431106567382812, 26.230144500732422, 28.0291805267334, 29.828216552734375, 31.627254486083984, 33.426292419433594, 35.22532653808594, 37.02436447143555, 38.823402404785156, 40.622440338134766, 42.421478271484375, 44.22051239013672, 46.01955032348633, 47.81858825683594, 49.61762237548828, 51.41666030883789, 53.2156982421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 5.0, 6.0, 9.0, 6.0, 12.0, 12.0, 21.0, 16.0, 12.0, 19.0, 24.0, 24.0, 30.0, 31.0, 35.0, 46.0, 41.0, 38.0, 27.0, 30.0, 41.0, 52.0, 36.0, 48.0, 31.0, 41.0, 28.0, 30.0, 39.0, 24.0, 24.0, 21.0, 16.0, 12.0, 23.0, 11.0, 14.0, 6.0, 15.0, 8.0, 7.0, 5.0, 5.0, 7.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.10070037841797, -52.170501708984375, -50.24030303955078, -48.31010818481445, -46.37990951538086, -44.449710845947266, -42.51951599121094, -40.589317321777344, -38.65911865234375, -36.728919982910156, -34.79872131347656, -32.868526458740234, -30.93832778930664, -29.008129119873047, -27.077932357788086, -25.147735595703125, -23.21753692626953, -21.287338256835938, -19.357141494750977, -17.426944732666016, -15.496746063232422, -13.566548347473145, -11.636350631713867, -9.70615291595459, -7.7759552001953125, -5.845757484436035, -3.915559768676758, -1.9853620529174805, -0.055164337158203125, 1.8750333786010742, 3.8052310943603516, 5.735428810119629, 7.665626525878906, 9.595824241638184, 11.526021957397461, 13.456219673156738, 15.386417388916016, 17.31661605834961, 19.24681282043457, 21.17700958251953, 23.107208251953125, 25.03740692138672, 26.96760368347168, 28.89780044555664, 30.827999114990234, 32.75819778442383, 34.688392639160156, 36.61859130859375, 38.548789978027344, 40.47898864746094, 42.40918731689453, 44.33938217163086, 46.26958084106445, 48.19977951049805, 50.129974365234375, 52.06017303466797, 53.99037170410156, 55.920570373535156, 57.85076904296875, 59.78096389770508, 61.71116256713867, 63.641361236572266, 65.5715560913086, 67.50175476074219, 69.43195343017578]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 11.0, 23.0, 32.0, 45.0, 93.0, 154.0, 263.0, 482.0, 836.0, 1606.0, 2889.0, 5478.0, 10367.0, 18643.0, 32824.0, 54837.0, 85412.0, 118716.0, 145552.0, 151630.0, 136410.0, 105598.0, 72402.0, 45511.0, 26568.0, 14945.0, 7973.0, 4194.0, 2243.0, 1265.0, 652.0, 363.0, 209.0, 127.0, 76.0, 51.0, 33.0, 19.0, 10.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0, -67.8330078125, -65.666015625, -63.4990234375, -61.33203125, -59.1650390625, -56.998046875, -54.8310546875, -52.6640625, -50.4970703125, -48.330078125, -46.1630859375, -43.99609375, -41.8291015625, -39.662109375, -37.4951171875, -35.328125, -33.1611328125, -30.994140625, -28.8271484375, -26.66015625, -24.4931640625, -22.326171875, -20.1591796875, -17.9921875, -15.8251953125, -13.658203125, -11.4912109375, -9.32421875, -7.1572265625, -4.990234375, -2.8232421875, -0.65625, 1.5107421875, 3.677734375, 5.8447265625, 8.01171875, 10.1787109375, 12.345703125, 14.5126953125, 16.6796875, 18.8466796875, 21.013671875, 23.1806640625, 25.34765625, 27.5146484375, 29.681640625, 31.8486328125, 34.015625, 36.1826171875, 38.349609375, 40.5166015625, 42.68359375, 44.8505859375, 47.017578125, 49.1845703125, 51.3515625, 53.5185546875, 55.685546875, 57.8525390625, 60.01953125, 62.1865234375, 64.353515625, 66.5205078125, 68.6875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 6.0, 9.0, 5.0, 10.0, 14.0, 19.0, 17.0, 13.0, 22.0, 19.0, 28.0, 26.0, 32.0, 32.0, 47.0, 36.0, 43.0, 28.0, 35.0, 39.0, 44.0, 45.0, 36.0, 42.0, 40.0, 29.0, 34.0, 30.0, 34.0, 24.0, 16.0, 17.0, 12.0, 20.0, 14.0, 12.0, 9.0, 14.0, 8.0, 7.0, 4.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.65625, -49.81591796875, -47.9755859375, -46.13525390625, -44.294921875, -42.45458984375, -40.6142578125, -38.77392578125, -36.93359375, -35.09326171875, -33.2529296875, -31.41259765625, -29.572265625, -27.73193359375, -25.8916015625, -24.05126953125, -22.2109375, -20.37060546875, -18.5302734375, -16.68994140625, -14.849609375, -13.00927734375, -11.1689453125, -9.32861328125, -7.48828125, -5.64794921875, -3.8076171875, -1.96728515625, -0.126953125, 1.71337890625, 3.5537109375, 5.39404296875, 7.234375, 9.07470703125, 10.9150390625, 12.75537109375, 14.595703125, 16.43603515625, 18.2763671875, 20.11669921875, 21.95703125, 23.79736328125, 25.6376953125, 27.47802734375, 29.318359375, 31.15869140625, 32.9990234375, 34.83935546875, 36.6796875, 38.52001953125, 40.3603515625, 42.20068359375, 44.041015625, 45.88134765625, 47.7216796875, 49.56201171875, 51.40234375, 53.24267578125, 55.0830078125, 56.92333984375, 58.763671875, 60.60400390625, 62.4443359375, 64.28466796875, 66.125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 5.0, 10.0, 6.0, 10.0, 10.0, 21.0, 43.0, 56.0, 84.0, 132.0, 191.0, 305.0, 509.0, 760.0, 1236.0, 1933.0, 3208.0, 5043.0, 7806.0, 12221.0, 18696.0, 28069.0, 40598.0, 56324.0, 75794.0, 93522.0, 107699.0, 114245.0, 109883.0, 97445.0, 79486.0, 61035.0, 43802.0, 30917.0, 20492.0, 13426.0, 8664.0, 5431.0, 3533.0, 2221.0, 1369.0, 841.0, 512.0, 332.0, 221.0, 141.0, 89.0, 62.0, 47.0, 21.0, 20.0, 13.0, 10.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-49.96875, -48.33642578125, -46.7041015625, -45.07177734375, -43.439453125, -41.80712890625, -40.1748046875, -38.54248046875, -36.91015625, -35.27783203125, -33.6455078125, -32.01318359375, -30.380859375, -28.74853515625, -27.1162109375, -25.48388671875, -23.8515625, -22.21923828125, -20.5869140625, -18.95458984375, -17.322265625, -15.68994140625, -14.0576171875, -12.42529296875, -10.79296875, -9.16064453125, -7.5283203125, -5.89599609375, -4.263671875, -2.63134765625, -0.9990234375, 0.63330078125, 2.265625, 3.89794921875, 5.5302734375, 7.16259765625, 8.794921875, 10.42724609375, 12.0595703125, 13.69189453125, 15.32421875, 16.95654296875, 18.5888671875, 20.22119140625, 21.853515625, 23.48583984375, 25.1181640625, 26.75048828125, 28.3828125, 30.01513671875, 31.6474609375, 33.27978515625, 34.912109375, 36.54443359375, 38.1767578125, 39.80908203125, 41.44140625, 43.07373046875, 44.7060546875, 46.33837890625, 47.970703125, 49.60302734375, 51.2353515625, 52.86767578125, 54.5]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 12.0, 4.0, 14.0, 13.0, 11.0, 21.0, 10.0, 25.0, 18.0, 25.0, 19.0, 25.0, 26.0, 41.0, 34.0, 35.0, 38.0, 36.0, 47.0, 45.0, 59.0, 41.0, 40.0, 43.0, 42.0, 32.0, 35.0, 30.0, 29.0, 17.0, 20.0, 29.0, 10.0, 14.0, 8.0, 8.0, 12.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.625, -36.40673828125, -35.1884765625, -33.97021484375, -32.751953125, -31.53369140625, -30.3154296875, -29.09716796875, -27.87890625, -26.66064453125, -25.4423828125, -24.22412109375, -23.005859375, -21.78759765625, -20.5693359375, -19.35107421875, -18.1328125, -16.91455078125, -15.6962890625, -14.47802734375, -13.259765625, -12.04150390625, -10.8232421875, -9.60498046875, -8.38671875, -7.16845703125, -5.9501953125, -4.73193359375, -3.513671875, -2.29541015625, -1.0771484375, 0.14111328125, 1.359375, 2.57763671875, 3.7958984375, 5.01416015625, 6.232421875, 7.45068359375, 8.6689453125, 9.88720703125, 11.10546875, 12.32373046875, 13.5419921875, 14.76025390625, 15.978515625, 17.19677734375, 18.4150390625, 19.63330078125, 20.8515625, 22.06982421875, 23.2880859375, 24.50634765625, 25.724609375, 26.94287109375, 28.1611328125, 29.37939453125, 30.59765625, 31.81591796875, 33.0341796875, 34.25244140625, 35.470703125, 36.68896484375, 37.9072265625, 39.12548828125, 40.34375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 11.0, 13.0, 12.0, 36.0, 27.0, 55.0, 85.0, 150.0, 223.0, 356.0, 598.0, 1078.0, 2152.0, 4187.0, 8555.0, 17692.0, 35574.0, 69833.0, 123960.0, 181024.0, 202795.0, 169482.0, 109806.0, 60399.0, 30620.0, 14842.0, 7153.0, 3582.0, 1843.0, 1006.0, 572.0, 318.0, 193.0, 123.0, 62.0, 48.0, 25.0, 26.0, 13.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.234375, -29.30078125, -28.3671875, -27.43359375, -26.5, -25.56640625, -24.6328125, -23.69921875, -22.765625, -21.83203125, -20.8984375, -19.96484375, -19.03125, -18.09765625, -17.1640625, -16.23046875, -15.296875, -14.36328125, -13.4296875, -12.49609375, -11.5625, -10.62890625, -9.6953125, -8.76171875, -7.828125, -6.89453125, -5.9609375, -5.02734375, -4.09375, -3.16015625, -2.2265625, -1.29296875, -0.359375, 0.57421875, 1.5078125, 2.44140625, 3.375, 4.30859375, 5.2421875, 6.17578125, 7.109375, 8.04296875, 8.9765625, 9.91015625, 10.84375, 11.77734375, 12.7109375, 13.64453125, 14.578125, 15.51171875, 16.4453125, 17.37890625, 18.3125, 19.24609375, 20.1796875, 21.11328125, 22.046875, 22.98046875, 23.9140625, 24.84765625, 25.78125, 26.71484375, 27.6484375, 28.58203125, 29.515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 10.0, 11.0, 8.0, 8.0, 18.0, 25.0, 34.0, 33.0, 54.0, 60.0, 65.0, 72.0, 71.0, 91.0, 69.0, 83.0, 61.0, 49.0, 40.0, 45.0, 33.0, 15.0, 14.0, 14.0, 7.0, 8.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.005054473876953125, -0.00494047999382019, -0.004826486110687256, -0.004712492227554321, -0.004598498344421387, -0.004484504461288452, -0.004370510578155518, -0.004256516695022583, -0.0041425228118896484, -0.004028528928756714, -0.003914535045623779, -0.0038005411624908447, -0.00368654727935791, -0.0035725533962249756, -0.003458559513092041, -0.0033445656299591064, -0.003230571746826172, -0.0031165778636932373, -0.0030025839805603027, -0.002888590097427368, -0.0027745962142944336, -0.002660602331161499, -0.0025466084480285645, -0.00243261456489563, -0.0023186206817626953, -0.0022046267986297607, -0.002090632915496826, -0.0019766390323638916, -0.001862645149230957, -0.0017486512660980225, -0.0016346573829650879, -0.0015206634998321533, -0.0014066696166992188, -0.0012926757335662842, -0.0011786818504333496, -0.001064687967300415, -0.0009506940841674805, -0.0008367002010345459, -0.0007227063179016113, -0.0006087124347686768, -0.0004947185516357422, -0.0003807246685028076, -0.00026673078536987305, -0.00015273690223693848, -3.8743019104003906e-05, 7.525086402893066e-05, 0.00018924474716186523, 0.0003032386302947998, 0.0004172325134277344, 0.0005312263965606689, 0.0006452202796936035, 0.0007592141628265381, 0.0008732080459594727, 0.0009872019290924072, 0.0011011958122253418, 0.0012151896953582764, 0.001329183578491211, 0.0014431774616241455, 0.00155717134475708, 0.0016711652278900146, 0.0017851591110229492, 0.0018991529941558838, 0.0020131468772888184, 0.002127140760421753, 0.0022411346435546875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 6.0, 8.0, 7.0, 11.0, 18.0, 26.0, 46.0, 53.0, 91.0, 156.0, 268.0, 369.0, 628.0, 1035.0, 1678.0, 2683.0, 4770.0, 8837.0, 16130.0, 29619.0, 51987.0, 86848.0, 130224.0, 165309.0, 170468.0, 141135.0, 98507.0, 60199.0, 34386.0, 18875.0, 10412.0, 5687.0, 3243.0, 1931.0, 1108.0, 647.0, 419.0, 254.0, 147.0, 109.0, 95.0, 44.0, 27.0, 22.0, 12.0, 8.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.734375, -24.88037109375, -24.0263671875, -23.17236328125, -22.318359375, -21.46435546875, -20.6103515625, -19.75634765625, -18.90234375, -18.04833984375, -17.1943359375, -16.34033203125, -15.486328125, -14.63232421875, -13.7783203125, -12.92431640625, -12.0703125, -11.21630859375, -10.3623046875, -9.50830078125, -8.654296875, -7.80029296875, -6.9462890625, -6.09228515625, -5.23828125, -4.38427734375, -3.5302734375, -2.67626953125, -1.822265625, -0.96826171875, -0.1142578125, 0.73974609375, 1.59375, 2.44775390625, 3.3017578125, 4.15576171875, 5.009765625, 5.86376953125, 6.7177734375, 7.57177734375, 8.42578125, 9.27978515625, 10.1337890625, 10.98779296875, 11.841796875, 12.69580078125, 13.5498046875, 14.40380859375, 15.2578125, 16.11181640625, 16.9658203125, 17.81982421875, 18.673828125, 19.52783203125, 20.3818359375, 21.23583984375, 22.08984375, 22.94384765625, 23.7978515625, 24.65185546875, 25.505859375, 26.35986328125, 27.2138671875, 28.06787109375, 28.921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 1.0, 6.0, 3.0, 12.0, 17.0, 25.0, 24.0, 29.0, 38.0, 50.0, 65.0, 70.0, 84.0, 68.0, 64.0, 84.0, 55.0, 56.0, 53.0, 42.0, 42.0, 17.0, 26.0, 14.0, 16.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.4609375, -12.9974365234375, -12.533935546875, -12.0704345703125, -11.60693359375, -11.1434326171875, -10.679931640625, -10.2164306640625, -9.7529296875, -9.2894287109375, -8.825927734375, -8.3624267578125, -7.89892578125, -7.4354248046875, -6.971923828125, -6.5084228515625, -6.044921875, -5.5814208984375, -5.117919921875, -4.6544189453125, -4.19091796875, -3.7274169921875, -3.263916015625, -2.8004150390625, -2.3369140625, -1.8734130859375, -1.409912109375, -0.9464111328125, -0.48291015625, -0.0194091796875, 0.444091796875, 0.9075927734375, 1.37109375, 1.8345947265625, 2.298095703125, 2.7615966796875, 3.22509765625, 3.6885986328125, 4.152099609375, 4.6156005859375, 5.0791015625, 5.5426025390625, 6.006103515625, 6.4696044921875, 6.93310546875, 7.3966064453125, 7.860107421875, 8.3236083984375, 8.787109375, 9.2506103515625, 9.714111328125, 10.1776123046875, 10.64111328125, 11.1046142578125, 11.568115234375, 12.0316162109375, 12.4951171875, 12.9586181640625, 13.422119140625, 13.8856201171875, 14.34912109375, 14.8126220703125, 15.276123046875, 15.7396240234375, 16.203125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 9.0, 10.0, 9.0, 10.0, 16.0, 22.0, 18.0, 22.0, 31.0, 27.0, 32.0, 37.0, 37.0, 35.0, 42.0, 47.0, 34.0, 50.0, 45.0, 38.0, 24.0, 40.0, 27.0, 23.0, 27.0, 36.0, 25.0, 33.0, 31.0, 25.0, 21.0, 21.0, 19.0, 10.0, 14.0, 8.0, 7.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-60.84510803222656, -58.98116683959961, -57.11722946166992, -55.25328826904297, -53.389347076416016, -51.52540588378906, -49.661468505859375, -47.79752731323242, -45.93358612060547, -44.069644927978516, -42.20570755004883, -40.341766357421875, -38.47782516479492, -36.61388397216797, -34.74994659423828, -32.88600540161133, -31.02206802368164, -29.15812873840332, -27.294187545776367, -25.430248260498047, -23.566307067871094, -21.702367782592773, -19.838428497314453, -17.9744873046875, -16.11054801940918, -14.246607780456543, -12.382667541503906, -10.518728256225586, -8.65478801727295, -6.7908477783203125, -4.926908493041992, -3.0629682540893555, -1.1990318298339844, 0.6649081707000732, 2.528848171234131, 4.392787933349609, 6.256728172302246, 8.120668411254883, 9.984607696533203, 11.84854793548584, 13.712488174438477, 15.576428413391113, 17.44036865234375, 19.30430793762207, 21.16824722290039, 23.032188415527344, 24.896127700805664, 26.760066986083984, 28.624008178710938, 30.487947463989258, 32.35188674926758, 34.21582794189453, 36.079769134521484, 37.94371032714844, 39.807647705078125, 41.67158889770508, 43.53553009033203, 45.399471282958984, 47.26340866088867, 49.127349853515625, 50.99129104614258, 52.85523223876953, 54.71916961669922, 56.58311080932617, 58.44704818725586]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 5.0, 2.0, 9.0, 11.0, 16.0, 13.0, 9.0, 19.0, 18.0, 32.0, 31.0, 25.0, 37.0, 32.0, 25.0, 42.0, 36.0, 36.0, 40.0, 40.0, 36.0, 32.0, 41.0, 33.0, 43.0, 41.0, 30.0, 20.0, 32.0, 35.0, 24.0, 26.0, 16.0, 14.0, 13.0, 14.0, 9.0, 14.0, 10.0, 3.0, 11.0, 8.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-54.64284133911133, -52.721534729003906, -50.800228118896484, -48.87892150878906, -46.95761489868164, -45.03630828857422, -43.1150016784668, -41.193695068359375, -39.27238845825195, -37.35108184814453, -35.42977523803711, -33.50846862792969, -31.587162017822266, -29.665855407714844, -27.744548797607422, -25.8232421875, -23.901935577392578, -21.980628967285156, -20.059322357177734, -18.138015747070312, -16.21670913696289, -14.295402526855469, -12.374095916748047, -10.452789306640625, -8.531482696533203, -6.610176086425781, -4.688869476318359, -2.7675628662109375, -0.8462562561035156, 1.0750503540039062, 2.996356964111328, 4.91766357421875, 6.838966369628906, 8.760272979736328, 10.68157958984375, 12.602886199951172, 14.524192810058594, 16.445499420166016, 18.366806030273438, 20.28811264038086, 22.20941925048828, 24.130725860595703, 26.052032470703125, 27.973339080810547, 29.89464569091797, 31.81595230102539, 33.73725891113281, 35.658565521240234, 37.579872131347656, 39.50117874145508, 41.4224853515625, 43.34379196166992, 45.265098571777344, 47.186405181884766, 49.10771179199219, 51.02901840209961, 52.95032501220703, 54.87163162231445, 56.792938232421875, 58.7142448425293, 60.63555145263672, 62.55685806274414, 64.47816467285156, 66.39947509765625, 68.3207778930664]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 12.0, 17.0, 20.0, 46.0, 59.0, 123.0, 174.0, 298.0, 485.0, 803.0, 1253.0, 2126.0, 3530.0, 5505.0, 9112.0, 14945.0, 24060.0, 38424.0, 60402.0, 92812.0, 140249.0, 203516.0, 280648.0, 364383.0, 438720.0, 476999.0, 470202.0, 420598.0, 343168.0, 260727.0, 185471.0, 126067.0, 83052.0, 54487.0, 34546.0, 21552.0, 13518.0, 8436.0, 5191.0, 3225.0, 2025.0, 1231.0, 734.0, 498.0, 314.0, 202.0, 125.0, 65.0, 45.0, 29.0, 23.0, 12.0, 5.0, 5.0, 1.0, 4.0, 1.0], "bins": [-46.8125, -45.388671875, -43.96484375, -42.541015625, -41.1171875, -39.693359375, -38.26953125, -36.845703125, -35.421875, -33.998046875, -32.57421875, -31.150390625, -29.7265625, -28.302734375, -26.87890625, -25.455078125, -24.03125, -22.607421875, -21.18359375, -19.759765625, -18.3359375, -16.912109375, -15.48828125, -14.064453125, -12.640625, -11.216796875, -9.79296875, -8.369140625, -6.9453125, -5.521484375, -4.09765625, -2.673828125, -1.25, 0.173828125, 1.59765625, 3.021484375, 4.4453125, 5.869140625, 7.29296875, 8.716796875, 10.140625, 11.564453125, 12.98828125, 14.412109375, 15.8359375, 17.259765625, 18.68359375, 20.107421875, 21.53125, 22.955078125, 24.37890625, 25.802734375, 27.2265625, 28.650390625, 30.07421875, 31.498046875, 32.921875, 34.345703125, 35.76953125, 37.193359375, 38.6171875, 40.041015625, 41.46484375, 42.888671875, 44.3125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 14.0, 12.0, 15.0, 23.0, 14.0, 28.0, 32.0, 34.0, 40.0, 30.0, 34.0, 36.0, 37.0, 27.0, 43.0, 47.0, 43.0, 36.0, 36.0, 41.0, 43.0, 30.0, 28.0, 32.0, 31.0, 29.0, 25.0, 12.0, 18.0, 22.0, 5.0, 13.0, 14.0, 8.0, 10.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-48.375, -46.65283203125, -44.9306640625, -43.20849609375, -41.486328125, -39.76416015625, -38.0419921875, -36.31982421875, -34.59765625, -32.87548828125, -31.1533203125, -29.43115234375, -27.708984375, -25.98681640625, -24.2646484375, -22.54248046875, -20.8203125, -19.09814453125, -17.3759765625, -15.65380859375, -13.931640625, -12.20947265625, -10.4873046875, -8.76513671875, -7.04296875, -5.32080078125, -3.5986328125, -1.87646484375, -0.154296875, 1.56787109375, 3.2900390625, 5.01220703125, 6.734375, 8.45654296875, 10.1787109375, 11.90087890625, 13.623046875, 15.34521484375, 17.0673828125, 18.78955078125, 20.51171875, 22.23388671875, 23.9560546875, 25.67822265625, 27.400390625, 29.12255859375, 30.8447265625, 32.56689453125, 34.2890625, 36.01123046875, 37.7333984375, 39.45556640625, 41.177734375, 42.89990234375, 44.6220703125, 46.34423828125, 48.06640625, 49.78857421875, 51.5107421875, 53.23291015625, 54.955078125, 56.67724609375, 58.3994140625, 60.12158203125, 61.84375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 12.0, 12.0, 17.0, 30.0, 57.0, 114.0, 155.0, 317.0, 517.0, 909.0, 1703.0, 2894.0, 5337.0, 9258.0, 16180.0, 27868.0, 46970.0, 76536.0, 121801.0, 185460.0, 265494.0, 358204.0, 441560.0, 495081.0, 498400.0, 452484.0, 371805.0, 280442.0, 197543.0, 131098.0, 83177.0, 51024.0, 30400.0, 17688.0, 10230.0, 5962.0, 3311.0, 1824.0, 1051.0, 570.0, 315.0, 221.0, 110.0, 64.0, 32.0, 27.0, 11.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.46875, -49.7578125, -48.046875, -46.3359375, -44.625, -42.9140625, -41.203125, -39.4921875, -37.78125, -36.0703125, -34.359375, -32.6484375, -30.9375, -29.2265625, -27.515625, -25.8046875, -24.09375, -22.3828125, -20.671875, -18.9609375, -17.25, -15.5390625, -13.828125, -12.1171875, -10.40625, -8.6953125, -6.984375, -5.2734375, -3.5625, -1.8515625, -0.140625, 1.5703125, 3.28125, 4.9921875, 6.703125, 8.4140625, 10.125, 11.8359375, 13.546875, 15.2578125, 16.96875, 18.6796875, 20.390625, 22.1015625, 23.8125, 25.5234375, 27.234375, 28.9453125, 30.65625, 32.3671875, 34.078125, 35.7890625, 37.5, 39.2109375, 40.921875, 42.6328125, 44.34375, 46.0546875, 47.765625, 49.4765625, 51.1875, 52.8984375, 54.609375, 56.3203125, 58.03125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 5.0, 16.0, 12.0, 16.0, 24.0, 29.0, 41.0, 39.0, 48.0, 66.0, 74.0, 99.0, 119.0, 120.0, 140.0, 134.0, 185.0, 169.0, 202.0, 190.0, 220.0, 209.0, 187.0, 228.0, 188.0, 189.0, 170.0, 152.0, 130.0, 117.0, 107.0, 102.0, 79.0, 53.0, 38.0, 38.0, 33.0, 27.0, 18.0, 25.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.21875, -24.41552734375, -23.6123046875, -22.80908203125, -22.005859375, -21.20263671875, -20.3994140625, -19.59619140625, -18.79296875, -17.98974609375, -17.1865234375, -16.38330078125, -15.580078125, -14.77685546875, -13.9736328125, -13.17041015625, -12.3671875, -11.56396484375, -10.7607421875, -9.95751953125, -9.154296875, -8.35107421875, -7.5478515625, -6.74462890625, -5.94140625, -5.13818359375, -4.3349609375, -3.53173828125, -2.728515625, -1.92529296875, -1.1220703125, -0.31884765625, 0.484375, 1.28759765625, 2.0908203125, 2.89404296875, 3.697265625, 4.50048828125, 5.3037109375, 6.10693359375, 6.91015625, 7.71337890625, 8.5166015625, 9.31982421875, 10.123046875, 10.92626953125, 11.7294921875, 12.53271484375, 13.3359375, 14.13916015625, 14.9423828125, 15.74560546875, 16.548828125, 17.35205078125, 18.1552734375, 18.95849609375, 19.76171875, 20.56494140625, 21.3681640625, 22.17138671875, 22.974609375, 23.77783203125, 24.5810546875, 25.38427734375, 26.1875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 7.0, 5.0, 10.0, 7.0, 11.0, 8.0, 17.0, 11.0, 7.0, 13.0, 20.0, 12.0, 14.0, 28.0, 27.0, 26.0, 28.0, 32.0, 38.0, 41.0, 44.0, 39.0, 44.0, 33.0, 40.0, 38.0, 23.0, 43.0, 29.0, 28.0, 32.0, 38.0, 33.0, 18.0, 22.0, 15.0, 21.0, 11.0, 14.0, 9.0, 14.0, 13.0, 12.0, 5.0, 6.0, 9.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-52.89725875854492, -51.18734359741211, -49.47743225097656, -47.76751708984375, -46.0576057434082, -44.34769058227539, -42.637779235839844, -40.92786407470703, -39.217952728271484, -37.50803756713867, -35.798126220703125, -34.08821105957031, -32.378299713134766, -30.668384552001953, -28.958473205566406, -27.248558044433594, -25.538644790649414, -23.828731536865234, -22.118818283081055, -20.408905029296875, -18.698991775512695, -16.989078521728516, -15.27916431427002, -13.56925106048584, -11.85933780670166, -10.14942455291748, -8.4395112991333, -6.729597568511963, -5.019684314727783, -3.3097705841064453, -1.5998573303222656, 0.11005592346191406, 1.8199691772460938, 3.5298824310302734, 5.239795684814453, 6.949709415435791, 8.659622192382812, 10.369536399841309, 12.079449653625488, 13.789362907409668, 15.499276161193848, 17.209190368652344, 18.919103622436523, 20.629016876220703, 22.338930130004883, 24.048843383789062, 25.758756637573242, 27.468669891357422, 29.1785831451416, 30.88849639892578, 32.598411560058594, 34.30832290649414, 36.01823806762695, 37.7281494140625, 39.43806457519531, 41.14797592163086, 42.85789108276367, 44.567806243896484, 46.27771759033203, 47.987632751464844, 49.69754409790039, 51.4074592590332, 53.11737060546875, 54.82728576660156, 56.53719711303711]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 11.0, 10.0, 13.0, 13.0, 13.0, 14.0, 12.0, 25.0, 29.0, 22.0, 29.0, 34.0, 42.0, 42.0, 42.0, 38.0, 31.0, 44.0, 46.0, 39.0, 44.0, 33.0, 41.0, 34.0, 30.0, 36.0, 36.0, 27.0, 27.0, 21.0, 17.0, 16.0, 22.0, 12.0, 8.0, 8.0, 12.0, 4.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.406978607177734, -54.4423713684082, -52.477760314941406, -50.513153076171875, -48.548545837402344, -46.58393859863281, -44.619327545166016, -42.654720306396484, -40.69010925292969, -38.725502014160156, -36.76089096069336, -34.79628372192383, -32.8316764831543, -30.867067337036133, -28.90245819091797, -26.937850952148438, -24.973243713378906, -23.008634567260742, -21.04402732849121, -19.079418182373047, -17.114810943603516, -15.150201797485352, -13.185592651367188, -11.22098445892334, -9.256376266479492, -7.2917680740356445, -5.327159404754639, -3.362550735473633, -1.3979425430297852, 0.5666656494140625, 2.5312747955322266, 4.495882987976074, 6.460487365722656, 8.425095558166504, 10.389703750610352, 12.354312896728516, 14.318921089172363, 16.28352928161621, 18.248138427734375, 20.212745666503906, 22.17735481262207, 24.141963958740234, 26.106571197509766, 28.07118034362793, 30.035789489746094, 32.000396728515625, 33.965003967285156, 35.92961502075195, 37.894222259521484, 39.858829498291016, 41.82344055175781, 43.788047790527344, 45.752655029296875, 47.717262268066406, 49.6818733215332, 51.646480560302734, 53.61109161376953, 55.57569885253906, 57.54030990600586, 59.50491714477539, 61.46952438354492, 63.43413543701172, 65.39874267578125, 67.36334991455078, 69.32795715332031]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 10.0, 16.0, 21.0, 30.0, 43.0, 86.0, 129.0, 215.0, 375.0, 558.0, 1076.0, 1997.0, 3360.0, 5758.0, 9964.0, 17244.0, 28364.0, 46069.0, 69920.0, 98552.0, 125818.0, 140518.0, 137160.0, 116620.0, 87808.0, 60409.0, 38963.0, 23937.0, 14071.0, 8159.0, 4787.0, 2788.0, 1610.0, 889.0, 478.0, 288.0, 171.0, 112.0, 66.0, 37.0, 29.0, 16.0, 9.0, 7.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.53125, -24.675048828125, -23.81884765625, -22.962646484375, -22.1064453125, -21.250244140625, -20.39404296875, -19.537841796875, -18.681640625, -17.825439453125, -16.96923828125, -16.113037109375, -15.2568359375, -14.400634765625, -13.54443359375, -12.688232421875, -11.83203125, -10.975830078125, -10.11962890625, -9.263427734375, -8.4072265625, -7.551025390625, -6.69482421875, -5.838623046875, -4.982421875, -4.126220703125, -3.27001953125, -2.413818359375, -1.5576171875, -0.701416015625, 0.15478515625, 1.010986328125, 1.8671875, 2.723388671875, 3.57958984375, 4.435791015625, 5.2919921875, 6.148193359375, 7.00439453125, 7.860595703125, 8.716796875, 9.572998046875, 10.42919921875, 11.285400390625, 12.1416015625, 12.997802734375, 13.85400390625, 14.710205078125, 15.56640625, 16.422607421875, 17.27880859375, 18.135009765625, 18.9912109375, 19.847412109375, 20.70361328125, 21.559814453125, 22.416015625, 23.272216796875, 24.12841796875, 24.984619140625, 25.8408203125, 26.697021484375, 27.55322265625, 28.409423828125, 29.265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 11.0, 10.0, 10.0, 15.0, 14.0, 10.0, 14.0, 14.0, 22.0, 31.0, 23.0, 31.0, 34.0, 37.0, 41.0, 45.0, 40.0, 31.0, 42.0, 45.0, 39.0, 41.0, 36.0, 43.0, 33.0, 28.0, 38.0, 33.0, 31.0, 23.0, 23.0, 18.0, 14.0, 21.0, 16.0, 6.0, 8.0, 11.0, 6.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.03125, -55.04541015625, -53.0595703125, -51.07373046875, -49.087890625, -47.10205078125, -45.1162109375, -43.13037109375, -41.14453125, -39.15869140625, -37.1728515625, -35.18701171875, -33.201171875, -31.21533203125, -29.2294921875, -27.24365234375, -25.2578125, -23.27197265625, -21.2861328125, -19.30029296875, -17.314453125, -15.32861328125, -13.3427734375, -11.35693359375, -9.37109375, -7.38525390625, -5.3994140625, -3.41357421875, -1.427734375, 0.55810546875, 2.5439453125, 4.52978515625, 6.515625, 8.50146484375, 10.4873046875, 12.47314453125, 14.458984375, 16.44482421875, 18.4306640625, 20.41650390625, 22.40234375, 24.38818359375, 26.3740234375, 28.35986328125, 30.345703125, 32.33154296875, 34.3173828125, 36.30322265625, 38.2890625, 40.27490234375, 42.2607421875, 44.24658203125, 46.232421875, 48.21826171875, 50.2041015625, 52.18994140625, 54.17578125, 56.16162109375, 58.1474609375, 60.13330078125, 62.119140625, 64.10498046875, 66.0908203125, 68.07666015625, 70.0625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 9.0, 9.0, 12.0, 15.0, 24.0, 35.0, 49.0, 86.0, 116.0, 221.0, 411.0, 717.0, 1363.0, 2507.0, 4492.0, 8247.0, 15361.0, 29134.0, 192290.0, 717800.0, 35699.0, 18448.0, 9742.0, 5211.0, 2848.0, 1671.0, 879.0, 510.0, 245.0, 121.0, 106.0, 67.0, 35.0, 21.0, 15.0, 13.0, 4.0, 3.0, 11.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.625, -80.205078125, -77.78515625, -75.365234375, -72.9453125, -70.525390625, -68.10546875, -65.685546875, -63.265625, -60.845703125, -58.42578125, -56.005859375, -53.5859375, -51.166015625, -48.74609375, -46.326171875, -43.90625, -41.486328125, -39.06640625, -36.646484375, -34.2265625, -31.806640625, -29.38671875, -26.966796875, -24.546875, -22.126953125, -19.70703125, -17.287109375, -14.8671875, -12.447265625, -10.02734375, -7.607421875, -5.1875, -2.767578125, -0.34765625, 2.072265625, 4.4921875, 6.912109375, 9.33203125, 11.751953125, 14.171875, 16.591796875, 19.01171875, 21.431640625, 23.8515625, 26.271484375, 28.69140625, 31.111328125, 33.53125, 35.951171875, 38.37109375, 40.791015625, 43.2109375, 45.630859375, 48.05078125, 50.470703125, 52.890625, 55.310546875, 57.73046875, 60.150390625, 62.5703125, 64.990234375, 67.41015625, 69.830078125, 72.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 13.0, 17.0, 15.0, 19.0, 24.0, 13.0, 28.0, 34.0, 32.0, 38.0, 36.0, 31.0, 35.0, 41.0, 37.0, 39.0, 23.0, 37.0, 26.0, 30.0, 45.0, 43.0, 28.0, 35.0, 20.0, 39.0, 27.0, 20.0, 21.0, 14.0, 17.0, 13.0, 15.0, 18.0, 4.0, 8.0, 6.0, 10.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-37.46875, -36.17626953125, -34.8837890625, -33.59130859375, -32.298828125, -31.00634765625, -29.7138671875, -28.42138671875, -27.12890625, -25.83642578125, -24.5439453125, -23.25146484375, -21.958984375, -20.66650390625, -19.3740234375, -18.08154296875, -16.7890625, -15.49658203125, -14.2041015625, -12.91162109375, -11.619140625, -10.32666015625, -9.0341796875, -7.74169921875, -6.44921875, -5.15673828125, -3.8642578125, -2.57177734375, -1.279296875, 0.01318359375, 1.3056640625, 2.59814453125, 3.890625, 5.18310546875, 6.4755859375, 7.76806640625, 9.060546875, 10.35302734375, 11.6455078125, 12.93798828125, 14.23046875, 15.52294921875, 16.8154296875, 18.10791015625, 19.400390625, 20.69287109375, 21.9853515625, 23.27783203125, 24.5703125, 25.86279296875, 27.1552734375, 28.44775390625, 29.740234375, 31.03271484375, 32.3251953125, 33.61767578125, 34.91015625, 36.20263671875, 37.4951171875, 38.78759765625, 40.080078125, 41.37255859375, 42.6650390625, 43.95751953125, 45.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 8.0, 22.0, 23.0, 28.0, 36.0, 43.0, 56.0, 92.0, 136.0, 213.0, 332.0, 549.0, 848.0, 1436.0, 2504.0, 4515.0, 8505.0, 16439.0, 35883.0, 672400.0, 244580.0, 28724.0, 13991.0, 7360.0, 4156.0, 2251.0, 1222.0, 782.0, 432.0, 274.0, 199.0, 141.0, 76.0, 79.0, 45.0, 30.0, 32.0, 30.0, 10.0, 14.0, 9.0, 8.0, 3.0, 6.0, 2.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.18359375, -5.02099609375, -4.8583984375, -4.69580078125, -4.533203125, -4.37060546875, -4.2080078125, -4.04541015625, -3.8828125, -3.72021484375, -3.5576171875, -3.39501953125, -3.232421875, -3.06982421875, -2.9072265625, -2.74462890625, -2.58203125, -2.41943359375, -2.2568359375, -2.09423828125, -1.931640625, -1.76904296875, -1.6064453125, -1.44384765625, -1.28125, -1.11865234375, -0.9560546875, -0.79345703125, -0.630859375, -0.46826171875, -0.3056640625, -0.14306640625, 0.01953125, 0.18212890625, 0.3447265625, 0.50732421875, 0.669921875, 0.83251953125, 0.9951171875, 1.15771484375, 1.3203125, 1.48291015625, 1.6455078125, 1.80810546875, 1.970703125, 2.13330078125, 2.2958984375, 2.45849609375, 2.62109375, 2.78369140625, 2.9462890625, 3.10888671875, 3.271484375, 3.43408203125, 3.5966796875, 3.75927734375, 3.921875, 4.08447265625, 4.2470703125, 4.40966796875, 4.572265625, 4.73486328125, 4.8974609375, 5.06005859375, 5.22265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 3.0, 8.0, 10.0, 9.0, 12.0, 5.0, 18.0, 23.0, 12.0, 25.0, 20.0, 34.0, 29.0, 51.0, 49.0, 44.0, 57.0, 57.0, 52.0, 62.0, 45.0, 51.0, 36.0, 35.0, 32.0, 33.0, 31.0, 25.0, 20.0, 17.0, 13.0, 12.0, 10.0, 8.0, 7.0, 7.0, 7.0, 7.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00061798095703125, -0.0006001219153404236, -0.0005822628736495972, -0.0005644038319587708, -0.0005465447902679443, -0.0005286857485771179, -0.0005108267068862915, -0.0004929676651954651, -0.00047510862350463867, -0.00045724958181381226, -0.00043939054012298584, -0.0004215314984321594, -0.000403672456741333, -0.0003858134150505066, -0.0003679543733596802, -0.00035009533166885376, -0.00033223628997802734, -0.00031437724828720093, -0.0002965182065963745, -0.0002786591649055481, -0.0002608001232147217, -0.00024294108152389526, -0.00022508203983306885, -0.00020722299814224243, -0.00018936395645141602, -0.0001715049147605896, -0.00015364587306976318, -0.00013578683137893677, -0.00011792778968811035, -0.00010006874799728394, -8.220970630645752e-05, -6.43506646156311e-05, -4.649162292480469e-05, -2.863258123397827e-05, -1.0773539543151855e-05, 7.0855021476745605e-06, 2.4944543838500977e-05, 4.280358552932739e-05, 6.066262722015381e-05, 7.852166891098022e-05, 9.638071060180664e-05, 0.00011423975229263306, 0.00013209879398345947, 0.0001499578356742859, 0.0001678168773651123, 0.00018567591905593872, 0.00020353496074676514, 0.00022139400243759155, 0.00023925304412841797, 0.0002571120858192444, 0.0002749711275100708, 0.0002928301692008972, 0.00031068921089172363, 0.00032854825258255005, 0.00034640729427337646, 0.0003642663359642029, 0.0003821253776550293, 0.0003999844193458557, 0.00041784346103668213, 0.00043570250272750854, 0.00045356154441833496, 0.0004714205861091614, 0.0004892796277999878, 0.0005071386694908142, 0.0005249977111816406]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 6.0, 10.0, 14.0, 22.0, 20.0, 36.0, 49.0, 73.0, 120.0, 156.0, 219.0, 280.0, 439.0, 610.0, 949.0, 1560.0, 2572.0, 4545.0, 8854.0, 18010.0, 36725.0, 74127.0, 136651.0, 208399.0, 219956.0, 156264.0, 87894.0, 43924.0, 21741.0, 10681.0, 5577.0, 2995.0, 1724.0, 1093.0, 694.0, 484.0, 300.0, 224.0, 163.0, 111.0, 87.0, 84.0, 38.0, 25.0, 20.0, 6.0, 12.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.525390625, -3.40838623046875, -3.2913818359375, -3.17437744140625, -3.057373046875, -2.94036865234375, -2.8233642578125, -2.70635986328125, -2.58935546875, -2.47235107421875, -2.3553466796875, -2.23834228515625, -2.121337890625, -2.00433349609375, -1.8873291015625, -1.77032470703125, -1.6533203125, -1.53631591796875, -1.4193115234375, -1.30230712890625, -1.185302734375, -1.06829833984375, -0.9512939453125, -0.83428955078125, -0.71728515625, -0.60028076171875, -0.4832763671875, -0.36627197265625, -0.249267578125, -0.13226318359375, -0.0152587890625, 0.10174560546875, 0.21875, 0.33575439453125, 0.4527587890625, 0.56976318359375, 0.686767578125, 0.80377197265625, 0.9207763671875, 1.03778076171875, 1.15478515625, 1.27178955078125, 1.3887939453125, 1.50579833984375, 1.622802734375, 1.73980712890625, 1.8568115234375, 1.97381591796875, 2.0908203125, 2.20782470703125, 2.3248291015625, 2.44183349609375, 2.558837890625, 2.67584228515625, 2.7928466796875, 2.90985107421875, 3.02685546875, 3.14385986328125, 3.2608642578125, 3.37786865234375, 3.494873046875, 3.61187744140625, 3.7288818359375, 3.84588623046875, 3.962890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 8.0, 11.0, 20.0, 18.0, 31.0, 31.0, 62.0, 77.0, 96.0, 113.0, 118.0, 102.0, 80.0, 61.0, 44.0, 28.0, 14.0, 14.0, 8.0, 13.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4547882080078125, -1.404693603515625, -1.3545989990234375, -1.30450439453125, -1.2544097900390625, -1.204315185546875, -1.1542205810546875, -1.1041259765625, -1.0540313720703125, -1.003936767578125, -0.9538421630859375, -0.90374755859375, -0.8536529541015625, -0.803558349609375, -0.7534637451171875, -0.703369140625, -0.6532745361328125, -0.603179931640625, -0.5530853271484375, -0.50299072265625, -0.4528961181640625, -0.402801513671875, -0.3527069091796875, -0.3026123046875, -0.2525177001953125, -0.202423095703125, -0.1523284912109375, -0.10223388671875, -0.0521392822265625, -0.002044677734375, 0.0480499267578125, 0.09814453125, 0.1482391357421875, 0.198333740234375, 0.2484283447265625, 0.29852294921875, 0.3486175537109375, 0.398712158203125, 0.4488067626953125, 0.4989013671875, 0.5489959716796875, 0.599090576171875, 0.6491851806640625, 0.69927978515625, 0.7493743896484375, 0.799468994140625, 0.8495635986328125, 0.899658203125, 0.9497528076171875, 0.999847412109375, 1.0499420166015625, 1.10003662109375, 1.1501312255859375, 1.200225830078125, 1.2503204345703125, 1.3004150390625, 1.3505096435546875, 1.400604248046875, 1.4506988525390625, 1.50079345703125, 1.5508880615234375, 1.600982666015625, 1.6510772705078125, 1.701171875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 5.0, 10.0, 9.0, 11.0, 10.0, 14.0, 9.0, 14.0, 13.0, 16.0, 20.0, 30.0, 19.0, 21.0, 22.0, 35.0, 42.0, 35.0, 33.0, 39.0, 43.0, 37.0, 40.0, 37.0, 34.0, 31.0, 31.0, 34.0, 42.0, 29.0, 26.0, 28.0, 21.0, 20.0, 17.0, 16.0, 20.0, 5.0, 9.0, 16.0, 10.0, 14.0, 6.0, 1.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-51.85308837890625, -50.14957809448242, -48.44607162475586, -46.74256134033203, -45.0390510559082, -43.335540771484375, -41.63203430175781, -39.928524017333984, -38.225013732910156, -36.52150344848633, -34.817996978759766, -33.11448669433594, -31.41097640991211, -29.707468032836914, -28.00395965576172, -26.30044937133789, -24.596942901611328, -22.893434524536133, -21.189924240112305, -19.48641586303711, -17.78290557861328, -16.079397201538086, -14.37588882446289, -12.672379493713379, -10.968870162963867, -9.265360832214355, -7.561851978302002, -5.858343124389648, -4.154833793640137, -2.451324462890625, -0.7478160858154297, 0.955693244934082, 2.6592025756835938, 4.3627119064331055, 6.066220760345459, 7.7697296142578125, 9.473238945007324, 11.176748275756836, 12.880256652832031, 14.583765983581543, 16.287275314331055, 17.99078369140625, 19.694293975830078, 21.397802352905273, 23.10131072998047, 24.804821014404297, 26.508329391479492, 28.211837768554688, 29.915348052978516, 31.61885643005371, 33.322364807128906, 35.025875091552734, 36.72938537597656, 38.432891845703125, 40.13640213012695, 41.83991241455078, 43.543418884277344, 45.24692916870117, 46.950435638427734, 48.65394592285156, 50.35745620727539, 52.06096649169922, 53.76447296142578, 55.46798324584961, 57.17149353027344]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 11.0, 8.0, 11.0, 16.0, 11.0, 14.0, 15.0, 25.0, 23.0, 27.0, 34.0, 32.0, 35.0, 45.0, 32.0, 46.0, 33.0, 45.0, 44.0, 37.0, 42.0, 30.0, 50.0, 30.0, 30.0, 40.0, 27.0, 32.0, 30.0, 19.0, 18.0, 13.0, 16.0, 24.0, 4.0, 14.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.00938415527344, -55.027931213378906, -53.04648208618164, -51.06502914428711, -49.083580017089844, -47.10212707519531, -45.12067413330078, -43.139225006103516, -41.15777587890625, -39.17632293701172, -37.19487380981445, -35.21342086791992, -33.231971740722656, -31.250518798828125, -29.269067764282227, -27.287616729736328, -25.306163787841797, -23.3247127532959, -21.34326171875, -19.36180877685547, -17.380359649658203, -15.398907661437988, -13.417455673217773, -11.436004638671875, -9.454553604125977, -7.473102569580078, -5.4916510581970215, -3.510199546813965, -1.5287485122680664, 0.45270252227783203, 2.434154510498047, 4.415605545043945, 6.397056579589844, 8.378507614135742, 10.35995864868164, 12.341410636901855, 14.322861671447754, 16.30431365966797, 18.285764694213867, 20.267215728759766, 22.248666763305664, 24.230117797851562, 26.21156883239746, 28.19301986694336, 30.17447280883789, 32.155921936035156, 34.13737487792969, 36.11882781982422, 38.100276947021484, 40.081729888916016, 42.06317901611328, 44.04463195800781, 46.02608108520508, 48.00753402709961, 49.988983154296875, 51.970436096191406, 53.95188903808594, 55.93334197998047, 57.914791107177734, 59.896244049072266, 61.87769317626953, 63.85914611816406, 65.8405990600586, 67.82205200195312, 69.80349731445312]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 18.0, 18.0, 43.0, 63.0, 101.0, 184.0, 282.0, 496.0, 893.0, 1534.0, 2670.0, 4636.0, 8102.0, 13836.0, 22784.0, 36187.0, 54462.0, 76886.0, 100217.0, 118705.0, 127268.0, 122384.0, 106039.0, 83518.0, 60636.0, 41409.0, 26437.0, 16125.0, 9627.0, 5593.0, 3118.0, 1877.0, 967.0, 598.0, 350.0, 201.0, 114.0, 67.0, 45.0, 22.0, 12.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.96875, -53.17529296875, -51.3818359375, -49.58837890625, -47.794921875, -46.00146484375, -44.2080078125, -42.41455078125, -40.62109375, -38.82763671875, -37.0341796875, -35.24072265625, -33.447265625, -31.65380859375, -29.8603515625, -28.06689453125, -26.2734375, -24.47998046875, -22.6865234375, -20.89306640625, -19.099609375, -17.30615234375, -15.5126953125, -13.71923828125, -11.92578125, -10.13232421875, -8.3388671875, -6.54541015625, -4.751953125, -2.95849609375, -1.1650390625, 0.62841796875, 2.421875, 4.21533203125, 6.0087890625, 7.80224609375, 9.595703125, 11.38916015625, 13.1826171875, 14.97607421875, 16.76953125, 18.56298828125, 20.3564453125, 22.14990234375, 23.943359375, 25.73681640625, 27.5302734375, 29.32373046875, 31.1171875, 32.91064453125, 34.7041015625, 36.49755859375, 38.291015625, 40.08447265625, 41.8779296875, 43.67138671875, 45.46484375, 47.25830078125, 49.0517578125, 50.84521484375, 52.638671875, 54.43212890625, 56.2255859375, 58.01904296875, 59.8125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 10.0, 11.0, 13.0, 14.0, 10.0, 14.0, 12.0, 21.0, 29.0, 30.0, 30.0, 35.0, 35.0, 36.0, 38.0, 47.0, 40.0, 43.0, 45.0, 35.0, 39.0, 35.0, 44.0, 31.0, 29.0, 33.0, 38.0, 31.0, 31.0, 15.0, 16.0, 17.0, 20.0, 17.0, 9.0, 9.0, 10.0, 4.0, 7.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.71875, -52.81591796875, -50.9130859375, -49.01025390625, -47.107421875, -45.20458984375, -43.3017578125, -41.39892578125, -39.49609375, -37.59326171875, -35.6904296875, -33.78759765625, -31.884765625, -29.98193359375, -28.0791015625, -26.17626953125, -24.2734375, -22.37060546875, -20.4677734375, -18.56494140625, -16.662109375, -14.75927734375, -12.8564453125, -10.95361328125, -9.05078125, -7.14794921875, -5.2451171875, -3.34228515625, -1.439453125, 0.46337890625, 2.3662109375, 4.26904296875, 6.171875, 8.07470703125, 9.9775390625, 11.88037109375, 13.783203125, 15.68603515625, 17.5888671875, 19.49169921875, 21.39453125, 23.29736328125, 25.2001953125, 27.10302734375, 29.005859375, 30.90869140625, 32.8115234375, 34.71435546875, 36.6171875, 38.52001953125, 40.4228515625, 42.32568359375, 44.228515625, 46.13134765625, 48.0341796875, 49.93701171875, 51.83984375, 53.74267578125, 55.6455078125, 57.54833984375, 59.451171875, 61.35400390625, 63.2568359375, 65.15966796875, 67.0625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 15.0, 26.0, 26.0, 47.0, 93.0, 142.0, 245.0, 425.0, 748.0, 1379.0, 2651.0, 4791.0, 8485.0, 15129.0, 25978.0, 42115.0, 64208.0, 90517.0, 116813.0, 133375.0, 135467.0, 121817.0, 98133.0, 70803.0, 46488.0, 29235.0, 17300.0, 9924.0, 5457.0, 2992.0, 1692.0, 888.0, 457.0, 279.0, 161.0, 88.0, 59.0, 36.0, 28.0, 12.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-64.0625, -62.18505859375, -60.3076171875, -58.43017578125, -56.552734375, -54.67529296875, -52.7978515625, -50.92041015625, -49.04296875, -47.16552734375, -45.2880859375, -43.41064453125, -41.533203125, -39.65576171875, -37.7783203125, -35.90087890625, -34.0234375, -32.14599609375, -30.2685546875, -28.39111328125, -26.513671875, -24.63623046875, -22.7587890625, -20.88134765625, -19.00390625, -17.12646484375, -15.2490234375, -13.37158203125, -11.494140625, -9.61669921875, -7.7392578125, -5.86181640625, -3.984375, -2.10693359375, -0.2294921875, 1.64794921875, 3.525390625, 5.40283203125, 7.2802734375, 9.15771484375, 11.03515625, 12.91259765625, 14.7900390625, 16.66748046875, 18.544921875, 20.42236328125, 22.2998046875, 24.17724609375, 26.0546875, 27.93212890625, 29.8095703125, 31.68701171875, 33.564453125, 35.44189453125, 37.3193359375, 39.19677734375, 41.07421875, 42.95166015625, 44.8291015625, 46.70654296875, 48.583984375, 50.46142578125, 52.3388671875, 54.21630859375, 56.09375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 8.0, 10.0, 21.0, 12.0, 14.0, 34.0, 34.0, 35.0, 31.0, 31.0, 33.0, 39.0, 37.0, 41.0, 43.0, 40.0, 38.0, 46.0, 43.0, 39.0, 38.0, 35.0, 33.0, 26.0, 24.0, 34.0, 33.0, 23.0, 14.0, 17.0, 11.0, 14.0, 5.0, 11.0, 8.0, 9.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.2587890625, -32.955078125, -31.6513671875, -30.34765625, -29.0439453125, -27.740234375, -26.4365234375, -25.1328125, -23.8291015625, -22.525390625, -21.2216796875, -19.91796875, -18.6142578125, -17.310546875, -16.0068359375, -14.703125, -13.3994140625, -12.095703125, -10.7919921875, -9.48828125, -8.1845703125, -6.880859375, -5.5771484375, -4.2734375, -2.9697265625, -1.666015625, -0.3623046875, 0.94140625, 2.2451171875, 3.548828125, 4.8525390625, 6.15625, 7.4599609375, 8.763671875, 10.0673828125, 11.37109375, 12.6748046875, 13.978515625, 15.2822265625, 16.5859375, 17.8896484375, 19.193359375, 20.4970703125, 21.80078125, 23.1044921875, 24.408203125, 25.7119140625, 27.015625, 28.3193359375, 29.623046875, 30.9267578125, 32.23046875, 33.5341796875, 34.837890625, 36.1416015625, 37.4453125, 38.7490234375, 40.052734375, 41.3564453125, 42.66015625, 43.9638671875, 45.267578125, 46.5712890625, 47.875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 6.0, 15.0, 18.0, 32.0, 45.0, 113.0, 222.0, 370.0, 724.0, 1563.0, 3602.0, 8526.0, 20222.0, 46512.0, 101883.0, 180054.0, 233613.0, 208294.0, 129957.0, 64116.0, 27944.0, 11632.0, 4889.0, 2116.0, 974.0, 500.0, 254.0, 135.0, 75.0, 53.0, 35.0, 21.0, 8.0, 10.0, 8.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.09375, -39.9091796875, -38.724609375, -37.5400390625, -36.35546875, -35.1708984375, -33.986328125, -32.8017578125, -31.6171875, -30.4326171875, -29.248046875, -28.0634765625, -26.87890625, -25.6943359375, -24.509765625, -23.3251953125, -22.140625, -20.9560546875, -19.771484375, -18.5869140625, -17.40234375, -16.2177734375, -15.033203125, -13.8486328125, -12.6640625, -11.4794921875, -10.294921875, -9.1103515625, -7.92578125, -6.7412109375, -5.556640625, -4.3720703125, -3.1875, -2.0029296875, -0.818359375, 0.3662109375, 1.55078125, 2.7353515625, 3.919921875, 5.1044921875, 6.2890625, 7.4736328125, 8.658203125, 9.8427734375, 11.02734375, 12.2119140625, 13.396484375, 14.5810546875, 15.765625, 16.9501953125, 18.134765625, 19.3193359375, 20.50390625, 21.6884765625, 22.873046875, 24.0576171875, 25.2421875, 26.4267578125, 27.611328125, 28.7958984375, 29.98046875, 31.1650390625, 32.349609375, 33.5341796875, 34.71875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 3.0, 2.0, 11.0, 11.0, 13.0, 17.0, 30.0, 24.0, 26.0, 28.0, 24.0, 37.0, 34.0, 41.0, 42.0, 57.0, 44.0, 52.0, 46.0, 46.0, 37.0, 43.0, 41.0, 34.0, 36.0, 27.0, 25.0, 19.0, 21.0, 20.0, 20.0, 16.0, 10.0, 7.0, 9.0, 13.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.002246856689453125, -0.0021781325340270996, -0.0021094083786010742, -0.002040684223175049, -0.0019719600677490234, -0.001903235912322998, -0.0018345117568969727, -0.0017657876014709473, -0.0016970634460449219, -0.0016283392906188965, -0.001559615135192871, -0.0014908909797668457, -0.0014221668243408203, -0.001353442668914795, -0.0012847185134887695, -0.0012159943580627441, -0.0011472702026367188, -0.0010785460472106934, -0.001009821891784668, -0.0009410977363586426, -0.0008723735809326172, -0.0008036494255065918, -0.0007349252700805664, -0.000666201114654541, -0.0005974769592285156, -0.0005287528038024902, -0.00046002864837646484, -0.00039130449295043945, -0.00032258033752441406, -0.00025385618209838867, -0.00018513202667236328, -0.00011640787124633789, -4.76837158203125e-05, 2.104043960571289e-05, 8.976459503173828e-05, 0.00015848875045776367, 0.00022721290588378906, 0.00029593706130981445, 0.00036466121673583984, 0.00043338537216186523, 0.0005021095275878906, 0.000570833683013916, 0.0006395578384399414, 0.0007082819938659668, 0.0007770061492919922, 0.0008457303047180176, 0.000914454460144043, 0.0009831786155700684, 0.0010519027709960938, 0.0011206269264221191, 0.0011893510818481445, 0.00125807523727417, 0.0013267993927001953, 0.0013955235481262207, 0.001464247703552246, 0.0015329718589782715, 0.0016016960144042969, 0.0016704201698303223, 0.0017391443252563477, 0.001807868480682373, 0.0018765926361083984, 0.0019453167915344238, 0.0020140409469604492, 0.0020827651023864746, 0.0021514892578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 13.0, 14.0, 28.0, 39.0, 75.0, 90.0, 178.0, 251.0, 463.0, 683.0, 1144.0, 1897.0, 3243.0, 5687.0, 9818.0, 16813.0, 30027.0, 49888.0, 79978.0, 115233.0, 145215.0, 155958.0, 140039.0, 108431.0, 73550.0, 45660.0, 26973.0, 15566.0, 8969.0, 5175.0, 2985.0, 1754.0, 1064.0, 636.0, 366.0, 259.0, 149.0, 86.0, 58.0, 29.0, 19.0, 23.0, 4.0, 11.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.875, -24.0830078125, -23.291015625, -22.4990234375, -21.70703125, -20.9150390625, -20.123046875, -19.3310546875, -18.5390625, -17.7470703125, -16.955078125, -16.1630859375, -15.37109375, -14.5791015625, -13.787109375, -12.9951171875, -12.203125, -11.4111328125, -10.619140625, -9.8271484375, -9.03515625, -8.2431640625, -7.451171875, -6.6591796875, -5.8671875, -5.0751953125, -4.283203125, -3.4912109375, -2.69921875, -1.9072265625, -1.115234375, -0.3232421875, 0.46875, 1.2607421875, 2.052734375, 2.8447265625, 3.63671875, 4.4287109375, 5.220703125, 6.0126953125, 6.8046875, 7.5966796875, 8.388671875, 9.1806640625, 9.97265625, 10.7646484375, 11.556640625, 12.3486328125, 13.140625, 13.9326171875, 14.724609375, 15.5166015625, 16.30859375, 17.1005859375, 17.892578125, 18.6845703125, 19.4765625, 20.2685546875, 21.060546875, 21.8525390625, 22.64453125, 23.4365234375, 24.228515625, 25.0205078125, 25.8125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 5.0, 6.0, 6.0, 13.0, 21.0, 21.0, 40.0, 29.0, 42.0, 58.0, 55.0, 67.0, 85.0, 72.0, 69.0, 66.0, 70.0, 54.0, 56.0, 39.0, 26.0, 27.0, 18.0, 20.0, 10.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.4757080078125, -11.037353515625, -10.5989990234375, -10.16064453125, -9.7222900390625, -9.283935546875, -8.8455810546875, -8.4072265625, -7.9688720703125, -7.530517578125, -7.0921630859375, -6.65380859375, -6.2154541015625, -5.777099609375, -5.3387451171875, -4.900390625, -4.4620361328125, -4.023681640625, -3.5853271484375, -3.14697265625, -2.7086181640625, -2.270263671875, -1.8319091796875, -1.3935546875, -0.9552001953125, -0.516845703125, -0.0784912109375, 0.35986328125, 0.7982177734375, 1.236572265625, 1.6749267578125, 2.11328125, 2.5516357421875, 2.989990234375, 3.4283447265625, 3.86669921875, 4.3050537109375, 4.743408203125, 5.1817626953125, 5.6201171875, 6.0584716796875, 6.496826171875, 6.9351806640625, 7.37353515625, 7.8118896484375, 8.250244140625, 8.6885986328125, 9.126953125, 9.5653076171875, 10.003662109375, 10.4420166015625, 10.88037109375, 11.3187255859375, 11.757080078125, 12.1954345703125, 12.6337890625, 13.0721435546875, 13.510498046875, 13.9488525390625, 14.38720703125, 14.8255615234375, 15.263916015625, 15.7022705078125, 16.140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 7.0, 11.0, 7.0, 9.0, 14.0, 13.0, 20.0, 15.0, 18.0, 27.0, 42.0, 33.0, 30.0, 33.0, 45.0, 55.0, 30.0, 37.0, 46.0, 40.0, 45.0, 36.0, 42.0, 36.0, 36.0, 21.0, 28.0, 25.0, 28.0, 18.0, 29.0, 18.0, 10.0, 16.0, 12.0, 11.0, 6.0, 9.0, 4.0, 10.0, 2.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.68506622314453, -49.852203369140625, -48.01934051513672, -46.18647384643555, -44.35361099243164, -42.520748138427734, -40.68788528442383, -38.855018615722656, -37.02215576171875, -35.189292907714844, -33.35643005371094, -31.5235652923584, -29.69070053100586, -27.857837677001953, -26.024974822998047, -24.192110061645508, -22.3592472076416, -20.526384353637695, -18.693519592285156, -16.86065673828125, -15.027791976928711, -13.194929122924805, -11.362065315246582, -9.52920150756836, -7.696337699890137, -5.863473892211914, -4.030610084533691, -2.197746753692627, -0.3648829460144043, 1.4679803848266602, 3.300844192504883, 5.1337080001831055, 6.966571807861328, 8.79943561553955, 10.632299423217773, 12.46516227722168, 14.298027038574219, 16.130889892578125, 17.96375274658203, 19.79661750793457, 21.62948226928711, 23.462345123291016, 25.295209884643555, 27.12807273864746, 28.9609375, 30.793800354003906, 32.62666320800781, 34.45952606201172, 36.292388916015625, 38.12525177001953, 39.95811462402344, 41.79098129272461, 43.623844146728516, 45.45670700073242, 47.28956985473633, 49.1224365234375, 50.955299377441406, 52.78816223144531, 54.62102508544922, 56.45389175415039, 58.2867546081543, 60.1196174621582, 61.95248031616211, 63.78534698486328, 65.61820983886719]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 10.0, 9.0, 12.0, 10.0, 16.0, 13.0, 15.0, 12.0, 25.0, 18.0, 22.0, 27.0, 30.0, 36.0, 31.0, 30.0, 38.0, 45.0, 37.0, 35.0, 32.0, 30.0, 37.0, 48.0, 43.0, 36.0, 26.0, 22.0, 24.0, 22.0, 29.0, 24.0, 20.0, 14.0, 18.0, 20.0, 16.0, 9.0, 12.0, 9.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-57.952789306640625, -56.12928009033203, -54.30577087402344, -52.482261657714844, -50.65875244140625, -48.835243225097656, -47.01173400878906, -45.188228607177734, -43.36471939086914, -41.54121017456055, -39.71770095825195, -37.89419174194336, -36.070682525634766, -34.24717712402344, -32.423667907714844, -30.60015869140625, -28.776647567749023, -26.95313835144043, -25.129629135131836, -23.306121826171875, -21.48261260986328, -19.659103393554688, -17.835594177246094, -16.0120849609375, -14.188576698303223, -12.365067481994629, -10.541559219360352, -8.718050003051758, -6.894541263580322, -5.071032524108887, -3.247523307800293, -1.4240150451660156, 0.3994941711425781, 2.2230029106140137, 4.046511650085449, 5.870020866394043, 7.6935296058654785, 9.517038345336914, 11.340547561645508, 13.164055824279785, 14.987565040588379, 16.811073303222656, 18.63458251953125, 20.458091735839844, 22.281600952148438, 24.10511016845703, 25.928619384765625, 27.752126693725586, 29.57563591003418, 31.399145126342773, 33.222652435302734, 35.04616165161133, 36.86967086791992, 38.693180084228516, 40.51668930053711, 42.3401985168457, 44.1637077331543, 45.98721694946289, 47.810726165771484, 49.63423538208008, 51.45774459838867, 53.28125, 55.104759216308594, 56.92826843261719, 58.75177764892578]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 6.0, 9.0, 7.0, 12.0, 16.0, 41.0, 56.0, 114.0, 171.0, 276.0, 518.0, 845.0, 1430.0, 2432.0, 3982.0, 6618.0, 11230.0, 18183.0, 29285.0, 47799.0, 75373.0, 115975.0, 171795.0, 244658.0, 327657.0, 406329.0, 464337.0, 480116.0, 448525.0, 383491.0, 300464.0, 221609.0, 154049.0, 102335.0, 66236.0, 41896.0, 26034.0, 16115.0, 9533.0, 6024.0, 3466.0, 2147.0, 1237.0, 791.0, 462.0, 261.0, 158.0, 80.0, 50.0, 26.0, 9.0, 9.0, 7.0, 7.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0], "bins": [-46.3125, -44.83544921875, -43.3583984375, -41.88134765625, -40.404296875, -38.92724609375, -37.4501953125, -35.97314453125, -34.49609375, -33.01904296875, -31.5419921875, -30.06494140625, -28.587890625, -27.11083984375, -25.6337890625, -24.15673828125, -22.6796875, -21.20263671875, -19.7255859375, -18.24853515625, -16.771484375, -15.29443359375, -13.8173828125, -12.34033203125, -10.86328125, -9.38623046875, -7.9091796875, -6.43212890625, -4.955078125, -3.47802734375, -2.0009765625, -0.52392578125, 0.953125, 2.43017578125, 3.9072265625, 5.38427734375, 6.861328125, 8.33837890625, 9.8154296875, 11.29248046875, 12.76953125, 14.24658203125, 15.7236328125, 17.20068359375, 18.677734375, 20.15478515625, 21.6318359375, 23.10888671875, 24.5859375, 26.06298828125, 27.5400390625, 29.01708984375, 30.494140625, 31.97119140625, 33.4482421875, 34.92529296875, 36.40234375, 37.87939453125, 39.3564453125, 40.83349609375, 42.310546875, 43.78759765625, 45.2646484375, 46.74169921875, 48.21875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 8.0, 9.0, 11.0, 14.0, 13.0, 15.0, 9.0, 20.0, 20.0, 20.0, 18.0, 32.0, 31.0, 24.0, 35.0, 37.0, 36.0, 44.0, 36.0, 38.0, 25.0, 36.0, 35.0, 52.0, 37.0, 32.0, 37.0, 23.0, 21.0, 23.0, 25.0, 22.0, 19.0, 16.0, 19.0, 17.0, 20.0, 8.0, 12.0, 10.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-48.96875, -47.3779296875, -45.787109375, -44.1962890625, -42.60546875, -41.0146484375, -39.423828125, -37.8330078125, -36.2421875, -34.6513671875, -33.060546875, -31.4697265625, -29.87890625, -28.2880859375, -26.697265625, -25.1064453125, -23.515625, -21.9248046875, -20.333984375, -18.7431640625, -17.15234375, -15.5615234375, -13.970703125, -12.3798828125, -10.7890625, -9.1982421875, -7.607421875, -6.0166015625, -4.42578125, -2.8349609375, -1.244140625, 0.3466796875, 1.9375, 3.5283203125, 5.119140625, 6.7099609375, 8.30078125, 9.8916015625, 11.482421875, 13.0732421875, 14.6640625, 16.2548828125, 17.845703125, 19.4365234375, 21.02734375, 22.6181640625, 24.208984375, 25.7998046875, 27.390625, 28.9814453125, 30.572265625, 32.1630859375, 33.75390625, 35.3447265625, 36.935546875, 38.5263671875, 40.1171875, 41.7080078125, 43.298828125, 44.8896484375, 46.48046875, 48.0712890625, 49.662109375, 51.2529296875, 52.84375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 12.0, 18.0, 41.0, 39.0, 75.0, 123.0, 193.0, 360.0, 598.0, 1028.0, 1830.0, 2987.0, 5234.0, 8709.0, 14719.0, 24372.0, 39141.0, 62090.0, 95903.0, 142267.0, 203593.0, 273915.0, 347688.0, 412171.0, 447502.0, 448860.0, 413315.0, 352027.0, 278462.0, 206765.0, 145842.0, 98444.0, 64030.0, 40405.0, 24981.0, 14831.0, 8919.0, 5273.0, 3100.0, 1875.0, 1003.0, 621.0, 403.0, 215.0, 113.0, 81.0, 44.0, 21.0, 23.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-52.25, -50.66796875, -49.0859375, -47.50390625, -45.921875, -44.33984375, -42.7578125, -41.17578125, -39.59375, -38.01171875, -36.4296875, -34.84765625, -33.265625, -31.68359375, -30.1015625, -28.51953125, -26.9375, -25.35546875, -23.7734375, -22.19140625, -20.609375, -19.02734375, -17.4453125, -15.86328125, -14.28125, -12.69921875, -11.1171875, -9.53515625, -7.953125, -6.37109375, -4.7890625, -3.20703125, -1.625, -0.04296875, 1.5390625, 3.12109375, 4.703125, 6.28515625, 7.8671875, 9.44921875, 11.03125, 12.61328125, 14.1953125, 15.77734375, 17.359375, 18.94140625, 20.5234375, 22.10546875, 23.6875, 25.26953125, 26.8515625, 28.43359375, 30.015625, 31.59765625, 33.1796875, 34.76171875, 36.34375, 37.92578125, 39.5078125, 41.08984375, 42.671875, 44.25390625, 45.8359375, 47.41796875, 49.0]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 5.0, 5.0, 12.0, 19.0, 15.0, 17.0, 23.0, 32.0, 36.0, 40.0, 61.0, 70.0, 92.0, 87.0, 102.0, 132.0, 132.0, 143.0, 167.0, 183.0, 187.0, 176.0, 192.0, 185.0, 160.0, 207.0, 170.0, 165.0, 148.0, 154.0, 135.0, 117.0, 119.0, 86.0, 84.0, 73.0, 80.0, 61.0, 38.0, 38.0, 31.0, 17.0, 11.0, 13.0, 11.0, 7.0, 11.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-21.90625, -21.189697265625, -20.47314453125, -19.756591796875, -19.0400390625, -18.323486328125, -17.60693359375, -16.890380859375, -16.173828125, -15.457275390625, -14.74072265625, -14.024169921875, -13.3076171875, -12.591064453125, -11.87451171875, -11.157958984375, -10.44140625, -9.724853515625, -9.00830078125, -8.291748046875, -7.5751953125, -6.858642578125, -6.14208984375, -5.425537109375, -4.708984375, -3.992431640625, -3.27587890625, -2.559326171875, -1.8427734375, -1.126220703125, -0.40966796875, 0.306884765625, 1.0234375, 1.739990234375, 2.45654296875, 3.173095703125, 3.8896484375, 4.606201171875, 5.32275390625, 6.039306640625, 6.755859375, 7.472412109375, 8.18896484375, 8.905517578125, 9.6220703125, 10.338623046875, 11.05517578125, 11.771728515625, 12.48828125, 13.204833984375, 13.92138671875, 14.637939453125, 15.3544921875, 16.071044921875, 16.78759765625, 17.504150390625, 18.220703125, 18.937255859375, 19.65380859375, 20.370361328125, 21.0869140625, 21.803466796875, 22.52001953125, 23.236572265625, 23.953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 7.0, 7.0, 13.0, 10.0, 18.0, 17.0, 9.0, 15.0, 25.0, 28.0, 32.0, 36.0, 36.0, 41.0, 38.0, 43.0, 42.0, 45.0, 46.0, 54.0, 49.0, 43.0, 26.0, 32.0, 42.0, 29.0, 30.0, 16.0, 25.0, 22.0, 21.0, 18.0, 13.0, 11.0, 19.0, 8.0, 5.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.52864074707031, -57.64255905151367, -55.75647735595703, -53.870399475097656, -51.984317779541016, -50.098236083984375, -48.212154388427734, -46.326072692871094, -44.43999099731445, -42.55390930175781, -40.66782760620117, -38.78174591064453, -36.895668029785156, -35.009586334228516, -33.123504638671875, -31.237422943115234, -29.351343154907227, -27.465261459350586, -25.579181671142578, -23.693099975585938, -21.807018280029297, -19.920936584472656, -18.03485679626465, -16.148775100708008, -14.262694358825684, -12.37661361694336, -10.490531921386719, -8.604451179504395, -6.718369960784912, -4.83228874206543, -2.9462080001831055, -1.0601263046264648, 0.8259544372558594, 2.712035655975342, 4.598116874694824, 6.484197616577148, 8.370279312133789, 10.256360054016113, 12.142440795898438, 14.028522491455078, 15.914603233337402, 17.800683975219727, 19.686765670776367, 21.572845458984375, 23.458927154541016, 25.345008850097656, 27.231090545654297, 29.117172241210938, 31.003252029418945, 32.88933181762695, 34.775413513183594, 36.661495208740234, 38.547576904296875, 40.433658599853516, 42.319740295410156, 44.20581817626953, 46.09189987182617, 47.97798156738281, 49.86406326293945, 51.750144958496094, 53.63622283935547, 55.52230453491211, 57.40838623046875, 59.29446792602539, 61.18054962158203]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 6.0, 10.0, 12.0, 21.0, 17.0, 21.0, 18.0, 21.0, 26.0, 34.0, 35.0, 25.0, 49.0, 34.0, 36.0, 36.0, 48.0, 48.0, 48.0, 23.0, 33.0, 30.0, 29.0, 40.0, 31.0, 30.0, 37.0, 20.0, 21.0, 26.0, 17.0, 22.0, 14.0, 10.0, 9.0, 12.0, 7.0, 4.0, 2.0, 11.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-64.69147491455078, -62.7783203125, -60.86516571044922, -58.95201110839844, -57.038856506347656, -55.125701904296875, -53.21254348754883, -51.29938888549805, -49.386234283447266, -47.473079681396484, -45.5599250793457, -43.64677047729492, -41.733612060546875, -39.820457458496094, -37.90730285644531, -35.99414825439453, -34.08099365234375, -32.16783905029297, -30.254684448242188, -28.341527938842773, -26.428373336791992, -24.51521873474121, -22.602062225341797, -20.688907623291016, -18.775753021240234, -16.862598419189453, -14.949442863464355, -13.036287307739258, -11.123132705688477, -9.209978103637695, -7.296822547912598, -5.3836669921875, -3.4705162048339844, -1.557361125946045, 0.35579395294189453, 2.268949031829834, 4.182104110717773, 6.095258712768555, 8.008414268493652, 9.92156982421875, 11.834724426269531, 13.747879028320312, 15.66103458404541, 17.574190139770508, 19.48734474182129, 21.40049934387207, 23.313655853271484, 25.226810455322266, 27.139965057373047, 29.053119659423828, 30.96627426147461, 32.87942886352539, 34.79258728027344, 36.70574188232422, 38.618896484375, 40.53205108642578, 42.44520568847656, 44.358360290527344, 46.271514892578125, 48.184669494628906, 50.09782409667969, 52.01097869873047, 53.924137115478516, 55.8372917175293, 57.75044631958008]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 9.0, 10.0, 15.0, 21.0, 42.0, 52.0, 110.0, 204.0, 287.0, 446.0, 667.0, 1074.0, 1732.0, 2695.0, 4164.0, 6549.0, 9802.0, 14721.0, 21784.0, 31119.0, 43144.0, 56914.0, 72665.0, 87571.0, 98149.0, 103846.0, 101154.0, 92112.0, 77995.0, 62614.0, 47788.0, 34640.0, 24810.0, 17211.0, 11566.0, 7461.0, 4902.0, 3037.0, 2011.0, 1298.0, 807.0, 497.0, 305.0, 206.0, 139.0, 88.0, 50.0, 31.0, 23.0, 7.0, 8.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-18.328125, -17.74951171875, -17.1708984375, -16.59228515625, -16.013671875, -15.43505859375, -14.8564453125, -14.27783203125, -13.69921875, -13.12060546875, -12.5419921875, -11.96337890625, -11.384765625, -10.80615234375, -10.2275390625, -9.64892578125, -9.0703125, -8.49169921875, -7.9130859375, -7.33447265625, -6.755859375, -6.17724609375, -5.5986328125, -5.02001953125, -4.44140625, -3.86279296875, -3.2841796875, -2.70556640625, -2.126953125, -1.54833984375, -0.9697265625, -0.39111328125, 0.1875, 0.76611328125, 1.3447265625, 1.92333984375, 2.501953125, 3.08056640625, 3.6591796875, 4.23779296875, 4.81640625, 5.39501953125, 5.9736328125, 6.55224609375, 7.130859375, 7.70947265625, 8.2880859375, 8.86669921875, 9.4453125, 10.02392578125, 10.6025390625, 11.18115234375, 11.759765625, 12.33837890625, 12.9169921875, 13.49560546875, 14.07421875, 14.65283203125, 15.2314453125, 15.81005859375, 16.388671875, 16.96728515625, 17.5458984375, 18.12451171875, 18.703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 8.0, 13.0, 18.0, 19.0, 21.0, 20.0, 19.0, 22.0, 35.0, 33.0, 27.0, 52.0, 30.0, 36.0, 40.0, 38.0, 54.0, 44.0, 29.0, 26.0, 36.0, 30.0, 37.0, 34.0, 24.0, 40.0, 23.0, 21.0, 24.0, 20.0, 16.0, 21.0, 9.0, 9.0, 14.0, 3.0, 7.0, 3.0, 4.0, 11.0, 0.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0], "bins": [-65.375, -63.4619140625, -61.548828125, -59.6357421875, -57.72265625, -55.8095703125, -53.896484375, -51.9833984375, -50.0703125, -48.1572265625, -46.244140625, -44.3310546875, -42.41796875, -40.5048828125, -38.591796875, -36.6787109375, -34.765625, -32.8525390625, -30.939453125, -29.0263671875, -27.11328125, -25.2001953125, -23.287109375, -21.3740234375, -19.4609375, -17.5478515625, -15.634765625, -13.7216796875, -11.80859375, -9.8955078125, -7.982421875, -6.0693359375, -4.15625, -2.2431640625, -0.330078125, 1.5830078125, 3.49609375, 5.4091796875, 7.322265625, 9.2353515625, 11.1484375, 13.0615234375, 14.974609375, 16.8876953125, 18.80078125, 20.7138671875, 22.626953125, 24.5400390625, 26.453125, 28.3662109375, 30.279296875, 32.1923828125, 34.10546875, 36.0185546875, 37.931640625, 39.8447265625, 41.7578125, 43.6708984375, 45.583984375, 47.4970703125, 49.41015625, 51.3232421875, 53.236328125, 55.1494140625, 57.0625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 13.0, 13.0, 15.0, 29.0, 20.0, 47.0, 68.0, 115.0, 166.0, 271.0, 439.0, 714.0, 1163.0, 1796.0, 3071.0, 5055.0, 8535.0, 14536.0, 24678.0, 65859.0, 822944.0, 44245.0, 22326.0, 12982.0, 7681.0, 4560.0, 2755.0, 1676.0, 1004.0, 679.0, 361.0, 249.0, 153.0, 108.0, 62.0, 43.0, 32.0, 29.0, 17.0, 13.0, 10.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.75, -62.75146484375, -60.7529296875, -58.75439453125, -56.755859375, -54.75732421875, -52.7587890625, -50.76025390625, -48.76171875, -46.76318359375, -44.7646484375, -42.76611328125, -40.767578125, -38.76904296875, -36.7705078125, -34.77197265625, -32.7734375, -30.77490234375, -28.7763671875, -26.77783203125, -24.779296875, -22.78076171875, -20.7822265625, -18.78369140625, -16.78515625, -14.78662109375, -12.7880859375, -10.78955078125, -8.791015625, -6.79248046875, -4.7939453125, -2.79541015625, -0.796875, 1.20166015625, 3.2001953125, 5.19873046875, 7.197265625, 9.19580078125, 11.1943359375, 13.19287109375, 15.19140625, 17.18994140625, 19.1884765625, 21.18701171875, 23.185546875, 25.18408203125, 27.1826171875, 29.18115234375, 31.1796875, 33.17822265625, 35.1767578125, 37.17529296875, 39.173828125, 41.17236328125, 43.1708984375, 45.16943359375, 47.16796875, 49.16650390625, 51.1650390625, 53.16357421875, 55.162109375, 57.16064453125, 59.1591796875, 61.15771484375, 63.15625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [8.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 7.0, 3.0, 5.0, 12.0, 12.0, 16.0, 20.0, 20.0, 15.0, 15.0, 16.0, 33.0, 22.0, 32.0, 33.0, 28.0, 31.0, 42.0, 46.0, 42.0, 39.0, 36.0, 44.0, 46.0, 29.0, 36.0, 34.0, 31.0, 35.0, 24.0, 36.0, 11.0, 23.0, 16.0, 16.0, 15.0, 14.0, 11.0, 13.0, 8.0, 4.0, 10.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-36.5, -35.20703125, -33.9140625, -32.62109375, -31.328125, -30.03515625, -28.7421875, -27.44921875, -26.15625, -24.86328125, -23.5703125, -22.27734375, -20.984375, -19.69140625, -18.3984375, -17.10546875, -15.8125, -14.51953125, -13.2265625, -11.93359375, -10.640625, -9.34765625, -8.0546875, -6.76171875, -5.46875, -4.17578125, -2.8828125, -1.58984375, -0.296875, 0.99609375, 2.2890625, 3.58203125, 4.875, 6.16796875, 7.4609375, 8.75390625, 10.046875, 11.33984375, 12.6328125, 13.92578125, 15.21875, 16.51171875, 17.8046875, 19.09765625, 20.390625, 21.68359375, 22.9765625, 24.26953125, 25.5625, 26.85546875, 28.1484375, 29.44140625, 30.734375, 32.02734375, 33.3203125, 34.61328125, 35.90625, 37.19921875, 38.4921875, 39.78515625, 41.078125, 42.37109375, 43.6640625, 44.95703125, 46.25]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 6.0, 13.0, 16.0, 20.0, 20.0, 28.0, 30.0, 54.0, 55.0, 85.0, 135.0, 197.0, 307.0, 415.0, 587.0, 875.0, 1283.0, 1981.0, 3019.0, 4365.0, 6915.0, 10843.0, 18394.0, 34143.0, 428441.0, 451171.0, 35013.0, 18489.0, 11139.0, 6921.0, 4500.0, 2956.0, 1949.0, 1310.0, 900.0, 582.0, 412.0, 292.0, 216.0, 153.0, 93.0, 56.0, 37.0, 31.0, 28.0, 22.0, 21.0, 10.0, 6.0, 6.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.021484375, -2.924041748046875, -2.82659912109375, -2.729156494140625, -2.6317138671875, -2.534271240234375, -2.43682861328125, -2.339385986328125, -2.241943359375, -2.144500732421875, -2.04705810546875, -1.949615478515625, -1.8521728515625, -1.754730224609375, -1.65728759765625, -1.559844970703125, -1.46240234375, -1.364959716796875, -1.26751708984375, -1.170074462890625, -1.0726318359375, -0.975189208984375, -0.87774658203125, -0.780303955078125, -0.682861328125, -0.585418701171875, -0.48797607421875, -0.390533447265625, -0.2930908203125, -0.195648193359375, -0.09820556640625, -0.000762939453125, 0.0966796875, 0.194122314453125, 0.29156494140625, 0.389007568359375, 0.4864501953125, 0.583892822265625, 0.68133544921875, 0.778778076171875, 0.876220703125, 0.973663330078125, 1.07110595703125, 1.168548583984375, 1.2659912109375, 1.363433837890625, 1.46087646484375, 1.558319091796875, 1.65576171875, 1.753204345703125, 1.85064697265625, 1.948089599609375, 2.0455322265625, 2.142974853515625, 2.24041748046875, 2.337860107421875, 2.435302734375, 2.532745361328125, 2.63018798828125, 2.727630615234375, 2.8250732421875, 2.922515869140625, 3.01995849609375, 3.117401123046875, 3.21484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 5.0, 3.0, 10.0, 8.0, 11.0, 16.0, 13.0, 20.0, 38.0, 41.0, 43.0, 49.0, 49.0, 70.0, 67.0, 55.0, 72.0, 68.0, 66.0, 60.0, 49.0, 34.0, 32.0, 21.0, 20.0, 19.0, 14.0, 6.0, 7.0, 8.0, 2.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0006780624389648438, -0.0006585270166397095, -0.0006389915943145752, -0.0006194561719894409, -0.0005999207496643066, -0.0005803853273391724, -0.0005608499050140381, -0.0005413144826889038, -0.0005217790603637695, -0.0005022436380386353, -0.000482708215713501, -0.0004631727933883667, -0.0004436373710632324, -0.00042410194873809814, -0.00040456652641296387, -0.0003850311040878296, -0.0003654956817626953, -0.00034596025943756104, -0.00032642483711242676, -0.0003068894147872925, -0.0002873539924621582, -0.0002678185701370239, -0.00024828314781188965, -0.00022874772548675537, -0.0002092123031616211, -0.00018967688083648682, -0.00017014145851135254, -0.00015060603618621826, -0.00013107061386108398, -0.00011153519153594971, -9.199976921081543e-05, -7.246434688568115e-05, -5.2928924560546875e-05, -3.33935022354126e-05, -1.385807991027832e-05, 5.677342414855957e-06, 2.5212764739990234e-05, 4.474818706512451e-05, 6.428360939025879e-05, 8.381903171539307e-05, 0.00010335445404052734, 0.00012288987636566162, 0.0001424252986907959, 0.00016196072101593018, 0.00018149614334106445, 0.00020103156566619873, 0.000220566987991333, 0.00024010241031646729, 0.00025963783264160156, 0.00027917325496673584, 0.0002987086772918701, 0.0003182440996170044, 0.00033777952194213867, 0.00035731494426727295, 0.0003768503665924072, 0.0003963857889175415, 0.0004159212112426758, 0.00043545663356781006, 0.00045499205589294434, 0.0004745274782180786, 0.0004940629005432129, 0.0005135983228683472, 0.0005331337451934814, 0.0005526691675186157, 0.00057220458984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 17.0, 23.0, 42.0, 58.0, 122.0, 160.0, 317.0, 476.0, 899.0, 1422.0, 2460.0, 4068.0, 7191.0, 12502.0, 21338.0, 36166.0, 58505.0, 87191.0, 118613.0, 141771.0, 146817.0, 130243.0, 100603.0, 69246.0, 44349.0, 26678.0, 15494.0, 8971.0, 5285.0, 3039.0, 1759.0, 1077.0, 636.0, 409.0, 240.0, 131.0, 81.0, 54.0, 38.0, 14.0, 18.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.57421875, -2.491729736328125, -2.40924072265625, -2.326751708984375, -2.2442626953125, -2.161773681640625, -2.07928466796875, -1.996795654296875, -1.914306640625, -1.831817626953125, -1.74932861328125, -1.666839599609375, -1.5843505859375, -1.501861572265625, -1.41937255859375, -1.336883544921875, -1.25439453125, -1.171905517578125, -1.08941650390625, -1.006927490234375, -0.9244384765625, -0.841949462890625, -0.75946044921875, -0.676971435546875, -0.594482421875, -0.511993408203125, -0.42950439453125, -0.347015380859375, -0.2645263671875, -0.182037353515625, -0.09954833984375, -0.017059326171875, 0.0654296875, 0.147918701171875, 0.23040771484375, 0.312896728515625, 0.3953857421875, 0.477874755859375, 0.56036376953125, 0.642852783203125, 0.725341796875, 0.807830810546875, 0.89031982421875, 0.972808837890625, 1.0552978515625, 1.137786865234375, 1.22027587890625, 1.302764892578125, 1.38525390625, 1.467742919921875, 1.55023193359375, 1.632720947265625, 1.7152099609375, 1.797698974609375, 1.88018798828125, 1.962677001953125, 2.045166015625, 2.127655029296875, 2.21014404296875, 2.292633056640625, 2.3751220703125, 2.457611083984375, 2.54010009765625, 2.622589111328125, 2.705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 4.0, 7.0, 15.0, 14.0, 18.0, 19.0, 34.0, 45.0, 40.0, 63.0, 56.0, 77.0, 63.0, 70.0, 67.0, 58.0, 58.0, 62.0, 46.0, 32.0, 30.0, 30.0, 14.0, 14.0, 11.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3828125, -1.342437744140625, -1.30206298828125, -1.261688232421875, -1.2213134765625, -1.180938720703125, -1.14056396484375, -1.100189208984375, -1.059814453125, -1.019439697265625, -0.97906494140625, -0.938690185546875, -0.8983154296875, -0.857940673828125, -0.81756591796875, -0.777191162109375, -0.73681640625, -0.696441650390625, -0.65606689453125, -0.615692138671875, -0.5753173828125, -0.534942626953125, -0.49456787109375, -0.454193115234375, -0.413818359375, -0.373443603515625, -0.33306884765625, -0.292694091796875, -0.2523193359375, -0.211944580078125, -0.17156982421875, -0.131195068359375, -0.0908203125, -0.050445556640625, -0.01007080078125, 0.030303955078125, 0.0706787109375, 0.111053466796875, 0.15142822265625, 0.191802978515625, 0.232177734375, 0.272552490234375, 0.31292724609375, 0.353302001953125, 0.3936767578125, 0.434051513671875, 0.47442626953125, 0.514801025390625, 0.55517578125, 0.595550537109375, 0.63592529296875, 0.676300048828125, 0.7166748046875, 0.757049560546875, 0.79742431640625, 0.837799072265625, 0.878173828125, 0.918548583984375, 0.95892333984375, 0.999298095703125, 1.0396728515625, 1.080047607421875, 1.12042236328125, 1.160797119140625, 1.201171875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 6.0, 6.0, 8.0, 14.0, 14.0, 19.0, 26.0, 13.0, 29.0, 21.0, 42.0, 37.0, 29.0, 40.0, 49.0, 32.0, 48.0, 41.0, 48.0, 54.0, 37.0, 40.0, 32.0, 25.0, 36.0, 33.0, 31.0, 16.0, 21.0, 19.0, 20.0, 19.0, 14.0, 17.0, 11.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.30906295776367, -57.45502471923828, -55.600990295410156, -53.746952056884766, -51.89291763305664, -50.03887939453125, -48.184844970703125, -46.330806732177734, -44.476768493652344, -42.62273025512695, -40.76869583129883, -38.91465759277344, -37.06062316894531, -35.20658493041992, -33.35254669189453, -31.498512268066406, -29.64447593688965, -27.79043960571289, -25.936403274536133, -24.082366943359375, -22.228328704833984, -20.374292373657227, -18.52025604248047, -16.666217803955078, -14.812182426452637, -12.958146095275879, -11.104108810424805, -9.250072479248047, -7.396035671234131, -5.541998863220215, -3.687962532043457, -1.8339252471923828, 0.020111083984375, 1.8741477727890015, 3.728184461593628, 5.582221031188965, 7.436257839202881, 9.290294647216797, 11.144330978393555, 12.998368263244629, 14.852404594421387, 16.70644187927246, 18.56047821044922, 20.414514541625977, 22.268550872802734, 24.122589111328125, 25.97662353515625, 27.83066177368164, 29.6846981048584, 31.538734436035156, 33.39277267456055, 35.24680709838867, 37.10084533691406, 38.95487976074219, 40.80891799926758, 42.66295623779297, 44.516990661621094, 46.371028900146484, 48.22506332397461, 50.0791015625, 51.933135986328125, 53.787174224853516, 55.641212463378906, 57.49524688720703, 59.34928512573242]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 9.0, 5.0, 8.0, 14.0, 14.0, 19.0, 19.0, 22.0, 21.0, 22.0, 33.0, 30.0, 33.0, 40.0, 38.0, 34.0, 40.0, 42.0, 52.0, 44.0, 35.0, 23.0, 37.0, 28.0, 37.0, 35.0, 25.0, 37.0, 25.0, 21.0, 25.0, 25.0, 11.0, 23.0, 7.0, 12.0, 12.0, 6.0, 8.0, 1.0, 7.0, 7.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-66.13524627685547, -64.21019744873047, -62.28514099121094, -60.36009216308594, -58.43503952026367, -56.509986877441406, -54.584938049316406, -52.65988540649414, -50.734832763671875, -48.80978012084961, -46.884727478027344, -44.959678649902344, -43.03462600708008, -41.10957336425781, -39.18452453613281, -37.25947189331055, -35.33441925048828, -33.409366607666016, -31.484315872192383, -29.55926513671875, -27.634212493896484, -25.70915985107422, -23.784109115600586, -21.859058380126953, -19.934005737304688, -18.008953094482422, -16.08390235900879, -14.15885066986084, -12.23379898071289, -10.308747291564941, -8.383695602416992, -6.458643913269043, -4.533588409423828, -2.608536720275879, -0.6834850311279297, 1.2415666580200195, 3.1666183471679688, 5.091670036315918, 7.016721725463867, 8.941773414611816, 10.866825103759766, 12.791876792907715, 14.716928482055664, 16.641979217529297, 18.567031860351562, 20.492084503173828, 22.41713523864746, 24.342185974121094, 26.26723861694336, 28.192291259765625, 30.117341995239258, 32.04239273071289, 33.967445373535156, 35.89249801635742, 37.81755065917969, 39.74259948730469, 41.66765213012695, 43.59270477294922, 45.51775360107422, 47.442806243896484, 49.36785888671875, 51.292911529541016, 53.21796417236328, 55.14301300048828, 57.06806564331055]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 12.0, 15.0, 16.0, 33.0, 49.0, 95.0, 162.0, 254.0, 468.0, 770.0, 1227.0, 2063.0, 3467.0, 5427.0, 8808.0, 13491.0, 20254.0, 29931.0, 41901.0, 56631.0, 72347.0, 87351.0, 98721.0, 104176.0, 102123.0, 94705.0, 80175.0, 65328.0, 50269.0, 36078.0, 25508.0, 17168.0, 11135.0, 7174.0, 4477.0, 2629.0, 1563.0, 1021.0, 609.0, 347.0, 220.0, 126.0, 85.0, 47.0, 39.0, 18.0, 19.0, 7.0, 7.0, 6.0, 3.0, 3.0], "bins": [-51.625, -50.18212890625, -48.7392578125, -47.29638671875, -45.853515625, -44.41064453125, -42.9677734375, -41.52490234375, -40.08203125, -38.63916015625, -37.1962890625, -35.75341796875, -34.310546875, -32.86767578125, -31.4248046875, -29.98193359375, -28.5390625, -27.09619140625, -25.6533203125, -24.21044921875, -22.767578125, -21.32470703125, -19.8818359375, -18.43896484375, -16.99609375, -15.55322265625, -14.1103515625, -12.66748046875, -11.224609375, -9.78173828125, -8.3388671875, -6.89599609375, -5.453125, -4.01025390625, -2.5673828125, -1.12451171875, 0.318359375, 1.76123046875, 3.2041015625, 4.64697265625, 6.08984375, 7.53271484375, 8.9755859375, 10.41845703125, 11.861328125, 13.30419921875, 14.7470703125, 16.18994140625, 17.6328125, 19.07568359375, 20.5185546875, 21.96142578125, 23.404296875, 24.84716796875, 26.2900390625, 27.73291015625, 29.17578125, 30.61865234375, 32.0615234375, 33.50439453125, 34.947265625, 36.39013671875, 37.8330078125, 39.27587890625, 40.71875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 7.0, 10.0, 5.0, 8.0, 13.0, 17.0, 18.0, 15.0, 23.0, 26.0, 20.0, 31.0, 31.0, 33.0, 46.0, 33.0, 41.0, 35.0, 38.0, 54.0, 48.0, 32.0, 29.0, 34.0, 27.0, 43.0, 31.0, 24.0, 36.0, 25.0, 24.0, 23.0, 21.0, 15.0, 17.0, 8.0, 13.0, 11.0, 7.0, 6.0, 2.0, 9.0, 5.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-63.90625, -62.03857421875, -60.1708984375, -58.30322265625, -56.435546875, -54.56787109375, -52.7001953125, -50.83251953125, -48.96484375, -47.09716796875, -45.2294921875, -43.36181640625, -41.494140625, -39.62646484375, -37.7587890625, -35.89111328125, -34.0234375, -32.15576171875, -30.2880859375, -28.42041015625, -26.552734375, -24.68505859375, -22.8173828125, -20.94970703125, -19.08203125, -17.21435546875, -15.3466796875, -13.47900390625, -11.611328125, -9.74365234375, -7.8759765625, -6.00830078125, -4.140625, -2.27294921875, -0.4052734375, 1.46240234375, 3.330078125, 5.19775390625, 7.0654296875, 8.93310546875, 10.80078125, 12.66845703125, 14.5361328125, 16.40380859375, 18.271484375, 20.13916015625, 22.0068359375, 23.87451171875, 25.7421875, 27.60986328125, 29.4775390625, 31.34521484375, 33.212890625, 35.08056640625, 36.9482421875, 38.81591796875, 40.68359375, 42.55126953125, 44.4189453125, 46.28662109375, 48.154296875, 50.02197265625, 51.8896484375, 53.75732421875, 55.625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 14.0, 19.0, 28.0, 42.0, 71.0, 109.0, 225.0, 400.0, 653.0, 1157.0, 2127.0, 3751.0, 6469.0, 11028.0, 18452.0, 29698.0, 45634.0, 66206.0, 88613.0, 109342.0, 122416.0, 123803.0, 113711.0, 95141.0, 72251.0, 51625.0, 33926.0, 21354.0, 12700.0, 7534.0, 4322.0, 2441.0, 1436.0, 809.0, 460.0, 244.0, 118.0, 93.0, 50.0, 30.0, 21.0, 11.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-59.71875, -57.9697265625, -56.220703125, -54.4716796875, -52.72265625, -50.9736328125, -49.224609375, -47.4755859375, -45.7265625, -43.9775390625, -42.228515625, -40.4794921875, -38.73046875, -36.9814453125, -35.232421875, -33.4833984375, -31.734375, -29.9853515625, -28.236328125, -26.4873046875, -24.73828125, -22.9892578125, -21.240234375, -19.4912109375, -17.7421875, -15.9931640625, -14.244140625, -12.4951171875, -10.74609375, -8.9970703125, -7.248046875, -5.4990234375, -3.75, -2.0009765625, -0.251953125, 1.4970703125, 3.24609375, 4.9951171875, 6.744140625, 8.4931640625, 10.2421875, 11.9912109375, 13.740234375, 15.4892578125, 17.23828125, 18.9873046875, 20.736328125, 22.4853515625, 24.234375, 25.9833984375, 27.732421875, 29.4814453125, 31.23046875, 32.9794921875, 34.728515625, 36.4775390625, 38.2265625, 39.9755859375, 41.724609375, 43.4736328125, 45.22265625, 46.9716796875, 48.720703125, 50.4697265625, 52.21875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 1.0, 7.0, 5.0, 9.0, 8.0, 18.0, 8.0, 13.0, 13.0, 18.0, 21.0, 25.0, 43.0, 45.0, 32.0, 42.0, 42.0, 44.0, 32.0, 45.0, 43.0, 48.0, 40.0, 36.0, 51.0, 46.0, 42.0, 32.0, 20.0, 28.0, 21.0, 20.0, 22.0, 12.0, 15.0, 12.0, 9.0, 5.0, 9.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.1611328125, -32.884765625, -31.6083984375, -30.33203125, -29.0556640625, -27.779296875, -26.5029296875, -25.2265625, -23.9501953125, -22.673828125, -21.3974609375, -20.12109375, -18.8447265625, -17.568359375, -16.2919921875, -15.015625, -13.7392578125, -12.462890625, -11.1865234375, -9.91015625, -8.6337890625, -7.357421875, -6.0810546875, -4.8046875, -3.5283203125, -2.251953125, -0.9755859375, 0.30078125, 1.5771484375, 2.853515625, 4.1298828125, 5.40625, 6.6826171875, 7.958984375, 9.2353515625, 10.51171875, 11.7880859375, 13.064453125, 14.3408203125, 15.6171875, 16.8935546875, 18.169921875, 19.4462890625, 20.72265625, 21.9990234375, 23.275390625, 24.5517578125, 25.828125, 27.1044921875, 28.380859375, 29.6572265625, 30.93359375, 32.2099609375, 33.486328125, 34.7626953125, 36.0390625, 37.3154296875, 38.591796875, 39.8681640625, 41.14453125, 42.4208984375, 43.697265625, 44.9736328125, 46.25]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 11.0, 26.0, 34.0, 57.0, 58.0, 121.0, 203.0, 293.0, 503.0, 857.0, 1322.0, 2229.0, 3670.0, 6008.0, 9759.0, 15776.0, 25028.0, 38276.0, 56786.0, 79037.0, 101597.0, 119689.0, 125760.0, 119399.0, 101764.0, 79075.0, 56686.0, 38493.0, 24879.0, 15709.0, 9812.0, 5992.0, 3702.0, 2404.0, 1351.0, 852.0, 538.0, 310.0, 189.0, 108.0, 81.0, 39.0, 25.0, 18.0, 9.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.265625, -20.630859375, -19.99609375, -19.361328125, -18.7265625, -18.091796875, -17.45703125, -16.822265625, -16.1875, -15.552734375, -14.91796875, -14.283203125, -13.6484375, -13.013671875, -12.37890625, -11.744140625, -11.109375, -10.474609375, -9.83984375, -9.205078125, -8.5703125, -7.935546875, -7.30078125, -6.666015625, -6.03125, -5.396484375, -4.76171875, -4.126953125, -3.4921875, -2.857421875, -2.22265625, -1.587890625, -0.953125, -0.318359375, 0.31640625, 0.951171875, 1.5859375, 2.220703125, 2.85546875, 3.490234375, 4.125, 4.759765625, 5.39453125, 6.029296875, 6.6640625, 7.298828125, 7.93359375, 8.568359375, 9.203125, 9.837890625, 10.47265625, 11.107421875, 11.7421875, 12.376953125, 13.01171875, 13.646484375, 14.28125, 14.916015625, 15.55078125, 16.185546875, 16.8203125, 17.455078125, 18.08984375, 18.724609375, 19.359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 0.0, 9.0, 6.0, 11.0, 9.0, 19.0, 26.0, 30.0, 28.0, 29.0, 40.0, 29.0, 35.0, 44.0, 47.0, 39.0, 58.0, 50.0, 52.0, 53.0, 52.0, 48.0, 54.0, 35.0, 30.0, 28.0, 21.0, 13.0, 14.0, 19.0, 13.0, 15.0, 8.0, 13.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027179718017578125, -0.0026380717754364014, -0.0025581717491149902, -0.002478271722793579, -0.002398371696472168, -0.002318471670150757, -0.0022385716438293457, -0.0021586716175079346, -0.0020787715911865234, -0.0019988715648651123, -0.0019189715385437012, -0.00183907151222229, -0.001759171485900879, -0.0016792714595794678, -0.0015993714332580566, -0.0015194714069366455, -0.0014395713806152344, -0.0013596713542938232, -0.0012797713279724121, -0.001199871301651001, -0.0011199712753295898, -0.0010400712490081787, -0.0009601712226867676, -0.0008802711963653564, -0.0008003711700439453, -0.0007204711437225342, -0.000640571117401123, -0.0005606710910797119, -0.0004807710647583008, -0.00040087103843688965, -0.0003209710121154785, -0.00024107098579406738, -0.00016117095947265625, -8.127093315124512e-05, -1.3709068298339844e-06, 7.852911949157715e-05, 0.00015842914581298828, 0.00023832917213439941, 0.00031822919845581055, 0.0003981292247772217, 0.0004780292510986328, 0.0005579292774200439, 0.0006378293037414551, 0.0007177293300628662, 0.0007976293563842773, 0.0008775293827056885, 0.0009574294090270996, 0.0010373294353485107, 0.0011172294616699219, 0.001197129487991333, 0.0012770295143127441, 0.0013569295406341553, 0.0014368295669555664, 0.0015167295932769775, 0.0015966296195983887, 0.0016765296459197998, 0.001756429672241211, 0.001836329698562622, 0.0019162297248840332, 0.0019961297512054443, 0.0020760297775268555, 0.0021559298038482666, 0.0022358298301696777, 0.002315729856491089, 0.0023956298828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 6.0, 10.0, 9.0, 15.0, 24.0, 29.0, 54.0, 79.0, 110.0, 181.0, 239.0, 386.0, 592.0, 894.0, 1309.0, 2182.0, 3423.0, 5398.0, 8586.0, 13496.0, 20716.0, 30839.0, 45531.0, 62592.0, 82705.0, 101267.0, 113885.0, 116311.0, 108279.0, 92450.0, 73503.0, 53948.0, 37497.0, 25511.0, 16645.0, 10920.0, 6888.0, 4310.0, 2761.0, 1780.0, 1084.0, 688.0, 512.0, 318.0, 188.0, 141.0, 74.0, 67.0, 42.0, 27.0, 30.0, 9.0, 7.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.25, -18.61376953125, -17.9775390625, -17.34130859375, -16.705078125, -16.06884765625, -15.4326171875, -14.79638671875, -14.16015625, -13.52392578125, -12.8876953125, -12.25146484375, -11.615234375, -10.97900390625, -10.3427734375, -9.70654296875, -9.0703125, -8.43408203125, -7.7978515625, -7.16162109375, -6.525390625, -5.88916015625, -5.2529296875, -4.61669921875, -3.98046875, -3.34423828125, -2.7080078125, -2.07177734375, -1.435546875, -0.79931640625, -0.1630859375, 0.47314453125, 1.109375, 1.74560546875, 2.3818359375, 3.01806640625, 3.654296875, 4.29052734375, 4.9267578125, 5.56298828125, 6.19921875, 6.83544921875, 7.4716796875, 8.10791015625, 8.744140625, 9.38037109375, 10.0166015625, 10.65283203125, 11.2890625, 11.92529296875, 12.5615234375, 13.19775390625, 13.833984375, 14.47021484375, 15.1064453125, 15.74267578125, 16.37890625, 17.01513671875, 17.6513671875, 18.28759765625, 18.923828125, 19.56005859375, 20.1962890625, 20.83251953125, 21.46875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 7.0, 9.0, 12.0, 12.0, 18.0, 14.0, 26.0, 34.0, 28.0, 29.0, 44.0, 43.0, 53.0, 32.0, 40.0, 53.0, 39.0, 45.0, 45.0, 55.0, 37.0, 46.0, 47.0, 37.0, 33.0, 26.0, 25.0, 18.0, 15.0, 10.0, 9.0, 13.0, 14.0, 9.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8359375, -10.5401611328125, -10.244384765625, -9.9486083984375, -9.65283203125, -9.3570556640625, -9.061279296875, -8.7655029296875, -8.4697265625, -8.1739501953125, -7.878173828125, -7.5823974609375, -7.28662109375, -6.9908447265625, -6.695068359375, -6.3992919921875, -6.103515625, -5.8077392578125, -5.511962890625, -5.2161865234375, -4.92041015625, -4.6246337890625, -4.328857421875, -4.0330810546875, -3.7373046875, -3.4415283203125, -3.145751953125, -2.8499755859375, -2.55419921875, -2.2584228515625, -1.962646484375, -1.6668701171875, -1.37109375, -1.0753173828125, -0.779541015625, -0.4837646484375, -0.18798828125, 0.1077880859375, 0.403564453125, 0.6993408203125, 0.9951171875, 1.2908935546875, 1.586669921875, 1.8824462890625, 2.17822265625, 2.4739990234375, 2.769775390625, 3.0655517578125, 3.361328125, 3.6571044921875, 3.952880859375, 4.2486572265625, 4.54443359375, 4.8402099609375, 5.135986328125, 5.4317626953125, 5.7275390625, 6.0233154296875, 6.319091796875, 6.6148681640625, 6.91064453125, 7.2064208984375, 7.502197265625, 7.7979736328125, 8.09375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 9.0, 6.0, 7.0, 10.0, 12.0, 16.0, 17.0, 13.0, 21.0, 14.0, 20.0, 28.0, 29.0, 40.0, 26.0, 30.0, 35.0, 33.0, 45.0, 32.0, 48.0, 36.0, 41.0, 30.0, 36.0, 37.0, 25.0, 40.0, 22.0, 34.0, 32.0, 30.0, 13.0, 15.0, 16.0, 20.0, 12.0, 19.0, 12.0, 5.0, 3.0, 4.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-52.6223258972168, -50.923892974853516, -49.2254638671875, -47.52703094482422, -45.82859802246094, -44.130165100097656, -42.431732177734375, -40.73330307006836, -39.03487014770508, -37.3364372253418, -35.63800811767578, -33.9395751953125, -32.24114227294922, -30.542709350585938, -28.84427833557129, -27.14584732055664, -25.44741439819336, -23.748981475830078, -22.05055046081543, -20.35211944580078, -18.6536865234375, -16.95525360107422, -15.25682258605957, -13.558390617370605, -11.85995864868164, -10.161526679992676, -8.463094711303711, -6.764662742614746, -5.066230773925781, -3.3677988052368164, -1.6693668365478516, 0.02906513214111328, 1.7274932861328125, 3.4259252548217773, 5.124357223510742, 6.822789192199707, 8.521221160888672, 10.219653129577637, 11.918085098266602, 13.616517066955566, 15.314949035644531, 17.013381958007812, 18.71181297302246, 20.41024398803711, 22.10867691040039, 23.807109832763672, 25.50554084777832, 27.20397186279297, 28.90240478515625, 30.60083770751953, 32.29927062988281, 33.99769973754883, 35.69613265991211, 37.39456558227539, 39.092994689941406, 40.79142761230469, 42.48986053466797, 44.18829345703125, 45.88672637939453, 47.58515548706055, 49.28358840942383, 50.98202133178711, 52.680450439453125, 54.378883361816406, 56.07731628417969]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 9.0, 1.0, 6.0, 6.0, 16.0, 18.0, 15.0, 20.0, 17.0, 16.0, 24.0, 32.0, 28.0, 34.0, 28.0, 34.0, 38.0, 33.0, 36.0, 35.0, 32.0, 43.0, 48.0, 46.0, 39.0, 21.0, 17.0, 29.0, 32.0, 23.0, 27.0, 24.0, 20.0, 22.0, 17.0, 18.0, 11.0, 17.0, 10.0, 9.0, 11.0, 8.0, 10.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0], "bins": [-60.79109191894531, -58.962013244628906, -57.132938385009766, -55.303863525390625, -53.47478485107422, -51.64570617675781, -49.81663131713867, -47.98755645751953, -46.158477783203125, -44.32939910888672, -42.50032424926758, -40.67124938964844, -38.84217071533203, -37.013092041015625, -35.184017181396484, -33.354942321777344, -31.525863647460938, -29.696786880493164, -27.86771011352539, -26.038633346557617, -24.209556579589844, -22.38047981262207, -20.551403045654297, -18.722326278686523, -16.89324951171875, -15.064172744750977, -13.235095977783203, -11.40601921081543, -9.576942443847656, -7.747865676879883, -5.918788909912109, -4.089712142944336, -2.2606353759765625, -0.43155860900878906, 1.3975181579589844, 3.226594924926758, 5.055671691894531, 6.884748458862305, 8.713825225830078, 10.542901992797852, 12.371978759765625, 14.201055526733398, 16.030132293701172, 17.859209060668945, 19.68828582763672, 21.517362594604492, 23.346439361572266, 25.17551612854004, 27.004592895507812, 28.833669662475586, 30.66274642944336, 32.4918212890625, 34.320899963378906, 36.14997863769531, 37.97905349731445, 39.808128356933594, 41.63720703125, 43.466285705566406, 45.29536056518555, 47.12443542480469, 48.953514099121094, 50.7825927734375, 52.61166763305664, 54.44074249267578, 56.26982116699219]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 11.0, 15.0, 16.0, 43.0, 53.0, 110.0, 202.0, 302.0, 560.0, 948.0, 1499.0, 2658.0, 4424.0, 7812.0, 12695.0, 21313.0, 34675.0, 56118.0, 87907.0, 135690.0, 197674.0, 274988.0, 359450.0, 433133.0, 476629.0, 474078.0, 429743.0, 355592.0, 271669.0, 193760.0, 132617.0, 86380.0, 54948.0, 34199.0, 20833.0, 12862.0, 7606.0, 4562.0, 2650.0, 1510.0, 927.0, 585.0, 333.0, 217.0, 109.0, 72.0, 44.0, 24.0, 16.0, 12.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-50.0, -48.48388671875, -46.9677734375, -45.45166015625, -43.935546875, -42.41943359375, -40.9033203125, -39.38720703125, -37.87109375, -36.35498046875, -34.8388671875, -33.32275390625, -31.806640625, -30.29052734375, -28.7744140625, -27.25830078125, -25.7421875, -24.22607421875, -22.7099609375, -21.19384765625, -19.677734375, -18.16162109375, -16.6455078125, -15.12939453125, -13.61328125, -12.09716796875, -10.5810546875, -9.06494140625, -7.548828125, -6.03271484375, -4.5166015625, -3.00048828125, -1.484375, 0.03173828125, 1.5478515625, 3.06396484375, 4.580078125, 6.09619140625, 7.6123046875, 9.12841796875, 10.64453125, 12.16064453125, 13.6767578125, 15.19287109375, 16.708984375, 18.22509765625, 19.7412109375, 21.25732421875, 22.7734375, 24.28955078125, 25.8056640625, 27.32177734375, 28.837890625, 30.35400390625, 31.8701171875, 33.38623046875, 34.90234375, 36.41845703125, 37.9345703125, 39.45068359375, 40.966796875, 42.48291015625, 43.9990234375, 45.51513671875, 47.03125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 8.0, 3.0, 7.0, 14.0, 17.0, 18.0, 17.0, 14.0, 10.0, 35.0, 27.0, 28.0, 37.0, 26.0, 33.0, 32.0, 33.0, 33.0, 42.0, 36.0, 41.0, 40.0, 53.0, 33.0, 26.0, 16.0, 27.0, 34.0, 20.0, 30.0, 23.0, 27.0, 16.0, 16.0, 19.0, 14.0, 16.0, 16.0, 10.0, 9.0, 6.0, 7.0, 10.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-53.53125, -51.93359375, -50.3359375, -48.73828125, -47.140625, -45.54296875, -43.9453125, -42.34765625, -40.75, -39.15234375, -37.5546875, -35.95703125, -34.359375, -32.76171875, -31.1640625, -29.56640625, -27.96875, -26.37109375, -24.7734375, -23.17578125, -21.578125, -19.98046875, -18.3828125, -16.78515625, -15.1875, -13.58984375, -11.9921875, -10.39453125, -8.796875, -7.19921875, -5.6015625, -4.00390625, -2.40625, -0.80859375, 0.7890625, 2.38671875, 3.984375, 5.58203125, 7.1796875, 8.77734375, 10.375, 11.97265625, 13.5703125, 15.16796875, 16.765625, 18.36328125, 19.9609375, 21.55859375, 23.15625, 24.75390625, 26.3515625, 27.94921875, 29.546875, 31.14453125, 32.7421875, 34.33984375, 35.9375, 37.53515625, 39.1328125, 40.73046875, 42.328125, 43.92578125, 45.5234375, 47.12109375, 48.71875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 15.0, 21.0, 45.0, 64.0, 87.0, 155.0, 255.0, 443.0, 727.0, 1218.0, 1868.0, 3018.0, 4789.0, 7671.0, 11638.0, 18312.0, 27826.0, 41486.0, 60697.0, 87082.0, 121527.0, 162519.0, 212577.0, 264046.0, 314088.0, 353107.0, 376755.0, 377906.0, 358145.0, 319335.0, 270766.0, 219291.0, 169721.0, 125538.0, 91449.0, 63584.0, 44140.0, 29060.0, 19277.0, 12505.0, 8014.0, 5046.0, 3227.0, 1969.0, 1299.0, 731.0, 498.0, 303.0, 169.0, 109.0, 77.0, 36.0, 24.0, 11.0, 7.0, 5.0, 2.0, 3.0], "bins": [-44.625, -43.275390625, -41.92578125, -40.576171875, -39.2265625, -37.876953125, -36.52734375, -35.177734375, -33.828125, -32.478515625, -31.12890625, -29.779296875, -28.4296875, -27.080078125, -25.73046875, -24.380859375, -23.03125, -21.681640625, -20.33203125, -18.982421875, -17.6328125, -16.283203125, -14.93359375, -13.583984375, -12.234375, -10.884765625, -9.53515625, -8.185546875, -6.8359375, -5.486328125, -4.13671875, -2.787109375, -1.4375, -0.087890625, 1.26171875, 2.611328125, 3.9609375, 5.310546875, 6.66015625, 8.009765625, 9.359375, 10.708984375, 12.05859375, 13.408203125, 14.7578125, 16.107421875, 17.45703125, 18.806640625, 20.15625, 21.505859375, 22.85546875, 24.205078125, 25.5546875, 26.904296875, 28.25390625, 29.603515625, 30.953125, 32.302734375, 33.65234375, 35.001953125, 36.3515625, 37.701171875, 39.05078125, 40.400390625, 41.75]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 13.0, 8.0, 11.0, 17.0, 19.0, 19.0, 20.0, 41.0, 33.0, 59.0, 67.0, 73.0, 93.0, 110.0, 115.0, 123.0, 132.0, 176.0, 167.0, 175.0, 197.0, 202.0, 216.0, 192.0, 212.0, 189.0, 175.0, 157.0, 159.0, 147.0, 127.0, 110.0, 94.0, 99.0, 60.0, 63.0, 36.0, 43.0, 35.0, 24.0, 17.0, 8.0, 14.0, 9.0, 5.0, 5.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.754638671875, -21.96240234375, -21.170166015625, -20.3779296875, -19.585693359375, -18.79345703125, -18.001220703125, -17.208984375, -16.416748046875, -15.62451171875, -14.832275390625, -14.0400390625, -13.247802734375, -12.45556640625, -11.663330078125, -10.87109375, -10.078857421875, -9.28662109375, -8.494384765625, -7.7021484375, -6.909912109375, -6.11767578125, -5.325439453125, -4.533203125, -3.740966796875, -2.94873046875, -2.156494140625, -1.3642578125, -0.572021484375, 0.22021484375, 1.012451171875, 1.8046875, 2.596923828125, 3.38916015625, 4.181396484375, 4.9736328125, 5.765869140625, 6.55810546875, 7.350341796875, 8.142578125, 8.934814453125, 9.72705078125, 10.519287109375, 11.3115234375, 12.103759765625, 12.89599609375, 13.688232421875, 14.48046875, 15.272705078125, 16.06494140625, 16.857177734375, 17.6494140625, 18.441650390625, 19.23388671875, 20.026123046875, 20.818359375, 21.610595703125, 22.40283203125, 23.195068359375, 23.9873046875, 24.779541015625, 25.57177734375, 26.364013671875, 27.15625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 9.0, 8.0, 17.0, 17.0, 17.0, 17.0, 22.0, 17.0, 25.0, 25.0, 27.0, 30.0, 36.0, 35.0, 40.0, 36.0, 50.0, 42.0, 37.0, 39.0, 47.0, 40.0, 33.0, 37.0, 40.0, 31.0, 28.0, 24.0, 21.0, 19.0, 20.0, 15.0, 13.0, 12.0, 11.0, 16.0, 4.0, 6.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-55.089813232421875, -53.33258819580078, -51.57536697387695, -49.818145751953125, -48.06092071533203, -46.30369567871094, -44.54647445678711, -42.78925323486328, -41.03202819824219, -39.274803161621094, -37.517581939697266, -35.76036071777344, -34.003135681152344, -32.24591064453125, -30.488689422607422, -28.73146629333496, -26.9742431640625, -25.21702003479004, -23.459796905517578, -21.702573776245117, -19.945350646972656, -18.188127517700195, -16.430904388427734, -14.673681259155273, -12.916458129882812, -11.159235000610352, -9.40201187133789, -7.64478874206543, -5.887565612792969, -4.130342483520508, -2.373119354248047, -0.6158962249755859, 1.1413230895996094, 2.8985462188720703, 4.655769348144531, 6.412992477416992, 8.170215606689453, 9.927438735961914, 11.684661865234375, 13.441884994506836, 15.199108123779297, 16.956331253051758, 18.71355438232422, 20.47077751159668, 22.22800064086914, 23.9852237701416, 25.742446899414062, 27.499670028686523, 29.256893157958984, 31.014116287231445, 32.771339416503906, 34.528564453125, 36.28578567504883, 38.043006896972656, 39.80023193359375, 41.557456970214844, 43.31467819213867, 45.0718994140625, 46.829124450683594, 48.58634948730469, 50.343570709228516, 52.100791931152344, 53.85801696777344, 55.61524200439453, 57.37246322631836]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 12.0, 9.0, 17.0, 8.0, 20.0, 15.0, 20.0, 19.0, 18.0, 27.0, 38.0, 43.0, 33.0, 37.0, 54.0, 56.0, 48.0, 42.0, 54.0, 45.0, 50.0, 34.0, 28.0, 30.0, 40.0, 34.0, 20.0, 20.0, 24.0, 16.0, 24.0, 9.0, 18.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.63072204589844, -65.49087524414062, -63.35102844238281, -61.211181640625, -59.07133483886719, -56.931488037109375, -54.79164123535156, -52.65179443359375, -50.51194763183594, -48.372100830078125, -46.23225402832031, -44.0924072265625, -41.95256042480469, -39.812713623046875, -37.67286682128906, -35.53302001953125, -33.39317321777344, -31.253326416015625, -29.113479614257812, -26.9736328125, -24.833786010742188, -22.693939208984375, -20.554092407226562, -18.41424560546875, -16.274398803710938, -14.134552001953125, -11.994705200195312, -9.8548583984375, -7.7150115966796875, -5.575164794921875, -3.4353179931640625, -1.29547119140625, 0.8443679809570312, 2.9842147827148438, 5.124061584472656, 7.263908386230469, 9.403755187988281, 11.543601989746094, 13.683448791503906, 15.823295593261719, 17.96314239501953, 20.102989196777344, 22.242835998535156, 24.38268280029297, 26.52252960205078, 28.662376403808594, 30.802223205566406, 32.94207000732422, 35.08191680908203, 37.221763610839844, 39.361610412597656, 41.50145721435547, 43.64130401611328, 45.781150817871094, 47.920997619628906, 50.06084442138672, 52.20069122314453, 54.340538024902344, 56.480384826660156, 58.62023162841797, 60.76007843017578, 62.899925231933594, 65.0397720336914, 67.17961883544922, 69.31946563720703]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 8.0, 12.0, 25.0, 26.0, 62.0, 91.0, 138.0, 260.0, 396.0, 603.0, 914.0, 1605.0, 2527.0, 4223.0, 6642.0, 10523.0, 16486.0, 24841.0, 37094.0, 52564.0, 70562.0, 89126.0, 105253.0, 114155.0, 112891.0, 102152.0, 84774.0, 66581.0, 48129.0, 33654.0, 22522.0, 14510.0, 9563.0, 5936.0, 3661.0, 2251.0, 1482.0, 885.0, 568.0, 317.0, 194.0, 133.0, 80.0, 50.0, 38.0, 18.0, 9.0, 10.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-17.265625, -16.740478515625, -16.21533203125, -15.690185546875, -15.1650390625, -14.639892578125, -14.11474609375, -13.589599609375, -13.064453125, -12.539306640625, -12.01416015625, -11.489013671875, -10.9638671875, -10.438720703125, -9.91357421875, -9.388427734375, -8.86328125, -8.338134765625, -7.81298828125, -7.287841796875, -6.7626953125, -6.237548828125, -5.71240234375, -5.187255859375, -4.662109375, -4.136962890625, -3.61181640625, -3.086669921875, -2.5615234375, -2.036376953125, -1.51123046875, -0.986083984375, -0.4609375, 0.064208984375, 0.58935546875, 1.114501953125, 1.6396484375, 2.164794921875, 2.68994140625, 3.215087890625, 3.740234375, 4.265380859375, 4.79052734375, 5.315673828125, 5.8408203125, 6.365966796875, 6.89111328125, 7.416259765625, 7.94140625, 8.466552734375, 8.99169921875, 9.516845703125, 10.0419921875, 10.567138671875, 11.09228515625, 11.617431640625, 12.142578125, 12.667724609375, 13.19287109375, 13.718017578125, 14.2431640625, 14.768310546875, 15.29345703125, 15.818603515625, 16.34375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 3.0, 11.0, 12.0, 14.0, 10.0, 19.0, 16.0, 21.0, 17.0, 20.0, 27.0, 41.0, 39.0, 36.0, 37.0, 55.0, 50.0, 53.0, 40.0, 52.0, 53.0, 43.0, 35.0, 28.0, 28.0, 43.0, 31.0, 20.0, 21.0, 21.0, 17.0, 25.0, 10.0, 16.0, 8.0, 6.0, 1.0, 8.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.375, -65.232421875, -63.08984375, -60.947265625, -58.8046875, -56.662109375, -54.51953125, -52.376953125, -50.234375, -48.091796875, -45.94921875, -43.806640625, -41.6640625, -39.521484375, -37.37890625, -35.236328125, -33.09375, -30.951171875, -28.80859375, -26.666015625, -24.5234375, -22.380859375, -20.23828125, -18.095703125, -15.953125, -13.810546875, -11.66796875, -9.525390625, -7.3828125, -5.240234375, -3.09765625, -0.955078125, 1.1875, 3.330078125, 5.47265625, 7.615234375, 9.7578125, 11.900390625, 14.04296875, 16.185546875, 18.328125, 20.470703125, 22.61328125, 24.755859375, 26.8984375, 29.041015625, 31.18359375, 33.326171875, 35.46875, 37.611328125, 39.75390625, 41.896484375, 44.0390625, 46.181640625, 48.32421875, 50.466796875, 52.609375, 54.751953125, 56.89453125, 59.037109375, 61.1796875, 63.322265625, 65.46484375, 67.607421875, 69.75]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 8.0, 19.0, 28.0, 42.0, 59.0, 101.0, 124.0, 210.0, 380.0, 701.0, 1161.0, 1983.0, 3774.0, 6799.0, 12682.0, 24370.0, 64058.0, 846814.0, 41624.0, 19884.0, 10689.0, 5795.0, 3108.0, 1713.0, 987.0, 581.0, 323.0, 197.0, 124.0, 83.0, 51.0, 20.0, 14.0, 13.0, 3.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-68.375, -66.26171875, -64.1484375, -62.03515625, -59.921875, -57.80859375, -55.6953125, -53.58203125, -51.46875, -49.35546875, -47.2421875, -45.12890625, -43.015625, -40.90234375, -38.7890625, -36.67578125, -34.5625, -32.44921875, -30.3359375, -28.22265625, -26.109375, -23.99609375, -21.8828125, -19.76953125, -17.65625, -15.54296875, -13.4296875, -11.31640625, -9.203125, -7.08984375, -4.9765625, -2.86328125, -0.75, 1.36328125, 3.4765625, 5.58984375, 7.703125, 9.81640625, 11.9296875, 14.04296875, 16.15625, 18.26953125, 20.3828125, 22.49609375, 24.609375, 26.72265625, 28.8359375, 30.94921875, 33.0625, 35.17578125, 37.2890625, 39.40234375, 41.515625, 43.62890625, 45.7421875, 47.85546875, 49.96875, 52.08203125, 54.1953125, 56.30859375, 58.421875, 60.53515625, 62.6484375, 64.76171875, 66.875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 7.0, 12.0, 12.0, 15.0, 9.0, 14.0, 5.0, 19.0, 21.0, 22.0, 26.0, 42.0, 27.0, 27.0, 37.0, 34.0, 41.0, 35.0, 43.0, 42.0, 48.0, 37.0, 42.0, 31.0, 38.0, 22.0, 22.0, 29.0, 34.0, 32.0, 29.0, 21.0, 20.0, 10.0, 11.0, 14.0, 22.0, 6.0, 12.0, 8.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.90625, -39.634765625, -38.36328125, -37.091796875, -35.8203125, -34.548828125, -33.27734375, -32.005859375, -30.734375, -29.462890625, -28.19140625, -26.919921875, -25.6484375, -24.376953125, -23.10546875, -21.833984375, -20.5625, -19.291015625, -18.01953125, -16.748046875, -15.4765625, -14.205078125, -12.93359375, -11.662109375, -10.390625, -9.119140625, -7.84765625, -6.576171875, -5.3046875, -4.033203125, -2.76171875, -1.490234375, -0.21875, 1.052734375, 2.32421875, 3.595703125, 4.8671875, 6.138671875, 7.41015625, 8.681640625, 9.953125, 11.224609375, 12.49609375, 13.767578125, 15.0390625, 16.310546875, 17.58203125, 18.853515625, 20.125, 21.396484375, 22.66796875, 23.939453125, 25.2109375, 26.482421875, 27.75390625, 29.025390625, 30.296875, 31.568359375, 32.83984375, 34.111328125, 35.3828125, 36.654296875, 37.92578125, 39.197265625, 40.46875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 2.0, 13.0, 4.0, 8.0, 12.0, 25.0, 21.0, 44.0, 62.0, 109.0, 173.0, 270.0, 430.0, 665.0, 1062.0, 1890.0, 3042.0, 5166.0, 9334.0, 17119.0, 35667.0, 691283.0, 219865.0, 28840.0, 14297.0, 7822.0, 4469.0, 2664.0, 1589.0, 966.0, 588.0, 362.0, 223.0, 151.0, 115.0, 71.0, 46.0, 28.0, 21.0, 9.0, 6.0, 11.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.046875, -3.923736572265625, -3.80059814453125, -3.677459716796875, -3.5543212890625, -3.431182861328125, -3.30804443359375, -3.184906005859375, -3.061767578125, -2.938629150390625, -2.81549072265625, -2.692352294921875, -2.5692138671875, -2.446075439453125, -2.32293701171875, -2.199798583984375, -2.07666015625, -1.953521728515625, -1.83038330078125, -1.707244873046875, -1.5841064453125, -1.460968017578125, -1.33782958984375, -1.214691162109375, -1.091552734375, -0.968414306640625, -0.84527587890625, -0.722137451171875, -0.5989990234375, -0.475860595703125, -0.35272216796875, -0.229583740234375, -0.1064453125, 0.016693115234375, 0.13983154296875, 0.262969970703125, 0.3861083984375, 0.509246826171875, 0.63238525390625, 0.755523681640625, 0.878662109375, 1.001800537109375, 1.12493896484375, 1.248077392578125, 1.3712158203125, 1.494354248046875, 1.61749267578125, 1.740631103515625, 1.86376953125, 1.986907958984375, 2.11004638671875, 2.233184814453125, 2.3563232421875, 2.479461669921875, 2.60260009765625, 2.725738525390625, 2.848876953125, 2.972015380859375, 3.09515380859375, 3.218292236328125, 3.3414306640625, 3.464569091796875, 3.58770751953125, 3.710845947265625, 3.833984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 6.0, 15.0, 24.0, 19.0, 22.0, 20.0, 31.0, 41.0, 53.0, 45.0, 64.0, 62.0, 55.0, 69.0, 69.0, 62.0, 52.0, 51.0, 46.0, 38.0, 34.0, 22.0, 13.0, 11.0, 11.0, 15.0, 6.0, 3.0, 3.0, 2.0, 8.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032973289489746094, -0.0003195516765117645, -0.0003093704581260681, -0.0002991892397403717, -0.0002890080213546753, -0.0002788268029689789, -0.00026864558458328247, -0.00025846436619758606, -0.00024828314781188965, -0.00023810192942619324, -0.00022792071104049683, -0.00021773949265480042, -0.000207558274269104, -0.0001973770558834076, -0.00018719583749771118, -0.00017701461911201477, -0.00016683340072631836, -0.00015665218234062195, -0.00014647096395492554, -0.00013628974556922913, -0.00012610852718353271, -0.0001159273087978363, -0.00010574609041213989, -9.556487202644348e-05, -8.538365364074707e-05, -7.520243525505066e-05, -6.502121686935425e-05, -5.483999848365784e-05, -4.4658780097961426e-05, -3.4477561712265015e-05, -2.4296343326568604e-05, -1.4115124940872192e-05, -3.933906555175781e-06, 6.24731183052063e-06, 1.642853021621704e-05, 2.6609748601913452e-05, 3.679096698760986e-05, 4.6972185373306274e-05, 5.7153403759002686e-05, 6.73346221446991e-05, 7.751584053039551e-05, 8.769705891609192e-05, 9.787827730178833e-05, 0.00010805949568748474, 0.00011824071407318115, 0.00012842193245887756, 0.00013860315084457397, 0.00014878436923027039, 0.0001589655876159668, 0.0001691468060016632, 0.00017932802438735962, 0.00018950924277305603, 0.00019969046115875244, 0.00020987167954444885, 0.00022005289793014526, 0.00023023411631584167, 0.00024041533470153809, 0.0002505965530872345, 0.0002607777714729309, 0.0002709589898586273, 0.00028114020824432373, 0.00029132142663002014, 0.00030150264501571655, 0.00031168386340141296, 0.0003218650817871094]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 15.0, 20.0, 22.0, 48.0, 83.0, 96.0, 142.0, 225.0, 328.0, 539.0, 804.0, 1305.0, 1914.0, 2805.0, 4298.0, 6560.0, 9772.0, 14553.0, 21426.0, 30320.0, 42355.0, 56279.0, 72241.0, 87534.0, 99925.0, 104887.0, 102726.0, 92544.0, 77478.0, 61433.0, 46939.0, 34226.0, 24359.0, 16709.0, 11382.0, 7474.0, 5017.0, 3372.0, 2109.0, 1528.0, 947.0, 672.0, 386.0, 258.0, 174.0, 112.0, 86.0, 37.0, 37.0, 14.0, 14.0, 12.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.19140625, -2.122222900390625, -2.05303955078125, -1.983856201171875, -1.9146728515625, -1.845489501953125, -1.77630615234375, -1.707122802734375, -1.637939453125, -1.568756103515625, -1.49957275390625, -1.430389404296875, -1.3612060546875, -1.292022705078125, -1.22283935546875, -1.153656005859375, -1.08447265625, -1.015289306640625, -0.94610595703125, -0.876922607421875, -0.8077392578125, -0.738555908203125, -0.66937255859375, -0.600189208984375, -0.531005859375, -0.461822509765625, -0.39263916015625, -0.323455810546875, -0.2542724609375, -0.185089111328125, -0.11590576171875, -0.046722412109375, 0.0224609375, 0.091644287109375, 0.16082763671875, 0.230010986328125, 0.2991943359375, 0.368377685546875, 0.43756103515625, 0.506744384765625, 0.575927734375, 0.645111083984375, 0.71429443359375, 0.783477783203125, 0.8526611328125, 0.921844482421875, 0.99102783203125, 1.060211181640625, 1.12939453125, 1.198577880859375, 1.26776123046875, 1.336944580078125, 1.4061279296875, 1.475311279296875, 1.54449462890625, 1.613677978515625, 1.682861328125, 1.752044677734375, 1.82122802734375, 1.890411376953125, 1.9595947265625, 2.028778076171875, 2.09796142578125, 2.167144775390625, 2.236328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 4.0, 13.0, 17.0, 19.0, 13.0, 22.0, 20.0, 17.0, 30.0, 29.0, 26.0, 40.0, 32.0, 39.0, 28.0, 31.0, 30.0, 40.0, 35.0, 43.0, 31.0, 38.0, 34.0, 40.0, 27.0, 28.0, 32.0, 28.0, 24.0, 34.0, 33.0, 23.0, 20.0, 18.0, 18.0, 7.0, 9.0, 8.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0146484375, -0.9815673828125, -0.948486328125, -0.9154052734375, -0.88232421875, -0.8492431640625, -0.816162109375, -0.7830810546875, -0.75, -0.7169189453125, -0.683837890625, -0.6507568359375, -0.61767578125, -0.5845947265625, -0.551513671875, -0.5184326171875, -0.4853515625, -0.4522705078125, -0.419189453125, -0.3861083984375, -0.35302734375, -0.3199462890625, -0.286865234375, -0.2537841796875, -0.220703125, -0.1876220703125, -0.154541015625, -0.1214599609375, -0.08837890625, -0.0552978515625, -0.022216796875, 0.0108642578125, 0.0439453125, 0.0770263671875, 0.110107421875, 0.1431884765625, 0.17626953125, 0.2093505859375, 0.242431640625, 0.2755126953125, 0.30859375, 0.3416748046875, 0.374755859375, 0.4078369140625, 0.44091796875, 0.4739990234375, 0.507080078125, 0.5401611328125, 0.5732421875, 0.6063232421875, 0.639404296875, 0.6724853515625, 0.70556640625, 0.7386474609375, 0.771728515625, 0.8048095703125, 0.837890625, 0.8709716796875, 0.904052734375, 0.9371337890625, 0.97021484375, 1.0032958984375, 1.036376953125, 1.0694580078125, 1.1025390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 3.0, 12.0, 10.0, 4.0, 19.0, 14.0, 19.0, 26.0, 18.0, 22.0, 22.0, 31.0, 33.0, 40.0, 27.0, 58.0, 29.0, 48.0, 49.0, 39.0, 30.0, 42.0, 43.0, 41.0, 36.0, 37.0, 37.0, 33.0, 18.0, 21.0, 21.0, 15.0, 24.0, 13.0, 15.0, 13.0, 6.0, 6.0, 4.0, 9.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.38033676147461, -53.55709457397461, -51.73385238647461, -49.91061019897461, -48.08736801147461, -46.26412582397461, -44.440887451171875, -42.617645263671875, -40.794403076171875, -38.971160888671875, -37.147918701171875, -35.324676513671875, -33.501434326171875, -31.678192138671875, -29.854951858520508, -28.031709671020508, -26.208465576171875, -24.385223388671875, -22.561981201171875, -20.738739013671875, -18.915496826171875, -17.092254638671875, -15.269014358520508, -13.445772171020508, -11.622529983520508, -9.799287796020508, -7.976046085357666, -6.152804374694824, -4.329562187194824, -2.506319999694824, -0.6830787658691406, 1.1401634216308594, 2.9634056091308594, 4.786647796630859, 6.609889507293701, 8.433131217956543, 10.256373405456543, 12.079615592956543, 13.902856826782227, 15.726099014282227, 17.549341201782227, 19.372583389282227, 21.195825576782227, 23.019065856933594, 24.842308044433594, 26.665550231933594, 28.488792419433594, 30.312034606933594, 32.135276794433594, 33.958518981933594, 35.781761169433594, 37.605003356933594, 39.428245544433594, 41.251487731933594, 43.074729919433594, 44.897972106933594, 46.721214294433594, 48.544456481933594, 50.367698669433594, 52.190940856933594, 54.014183044433594, 55.837425231933594, 57.660667419433594, 59.483909606933594, 61.30714797973633]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 7.0, 10.0, 9.0, 12.0, 14.0, 18.0, 15.0, 22.0, 21.0, 19.0, 26.0, 34.0, 48.0, 34.0, 50.0, 49.0, 50.0, 53.0, 45.0, 57.0, 53.0, 32.0, 40.0, 24.0, 36.0, 36.0, 33.0, 13.0, 21.0, 27.0, 21.0, 18.0, 12.0, 14.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.64140319824219, -66.4472427368164, -64.25308227539062, -62.058921813964844, -59.86476135253906, -57.67060089111328, -55.4764404296875, -53.28227996826172, -51.08811950683594, -48.893959045410156, -46.699798583984375, -44.505638122558594, -42.31147766113281, -40.11731719970703, -37.92315673828125, -35.72899627685547, -33.53483581542969, -31.340675354003906, -29.146514892578125, -26.952354431152344, -24.758193969726562, -22.56403350830078, -20.369873046875, -18.17571258544922, -15.981552124023438, -13.787391662597656, -11.593231201171875, -9.399070739746094, -7.2049102783203125, -5.010749816894531, -2.81658935546875, -0.6224288940429688, 1.5717391967773438, 3.765899658203125, 5.960060119628906, 8.154220581054688, 10.348381042480469, 12.54254150390625, 14.736701965332031, 16.930862426757812, 19.125022888183594, 21.319183349609375, 23.513343811035156, 25.707504272460938, 27.90166473388672, 30.0958251953125, 32.28998565673828, 34.48414611816406, 36.678306579589844, 38.872467041015625, 41.066627502441406, 43.26078796386719, 45.45494842529297, 47.64910888671875, 49.84326934814453, 52.03742980957031, 54.231590270996094, 56.425750732421875, 58.619911193847656, 60.81407165527344, 63.00823211669922, 65.202392578125, 67.39655303955078, 69.59071350097656, 71.78487396240234]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 13.0, 24.0, 25.0, 29.0, 46.0, 90.0, 129.0, 212.0, 346.0, 580.0, 894.0, 1339.0, 2063.0, 3184.0, 4697.0, 7297.0, 10661.0, 15494.0, 21968.0, 30123.0, 40381.0, 51593.0, 63610.0, 75477.0, 84733.0, 90799.0, 91530.0, 88087.0, 79538.0, 68016.0, 56747.0, 44721.0, 34137.0, 24851.0, 17738.0, 12511.0, 8646.0, 5731.0, 3692.0, 2449.0, 1595.0, 1008.0, 651.0, 409.0, 247.0, 160.0, 125.0, 63.0, 37.0, 18.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 2.0], "bins": [-42.40625, -41.12890625, -39.8515625, -38.57421875, -37.296875, -36.01953125, -34.7421875, -33.46484375, -32.1875, -30.91015625, -29.6328125, -28.35546875, -27.078125, -25.80078125, -24.5234375, -23.24609375, -21.96875, -20.69140625, -19.4140625, -18.13671875, -16.859375, -15.58203125, -14.3046875, -13.02734375, -11.75, -10.47265625, -9.1953125, -7.91796875, -6.640625, -5.36328125, -4.0859375, -2.80859375, -1.53125, -0.25390625, 1.0234375, 2.30078125, 3.578125, 4.85546875, 6.1328125, 7.41015625, 8.6875, 9.96484375, 11.2421875, 12.51953125, 13.796875, 15.07421875, 16.3515625, 17.62890625, 18.90625, 20.18359375, 21.4609375, 22.73828125, 24.015625, 25.29296875, 26.5703125, 27.84765625, 29.125, 30.40234375, 31.6796875, 32.95703125, 34.234375, 35.51171875, 36.7890625, 38.06640625, 39.34375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 14.0, 9.0, 12.0, 11.0, 21.0, 8.0, 23.0, 23.0, 20.0, 23.0, 34.0, 44.0, 41.0, 44.0, 52.0, 48.0, 54.0, 48.0, 54.0, 47.0, 40.0, 38.0, 26.0, 37.0, 37.0, 31.0, 15.0, 23.0, 24.0, 20.0, 21.0, 10.0, 14.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -64.322265625, -62.20703125, -60.091796875, -57.9765625, -55.861328125, -53.74609375, -51.630859375, -49.515625, -47.400390625, -45.28515625, -43.169921875, -41.0546875, -38.939453125, -36.82421875, -34.708984375, -32.59375, -30.478515625, -28.36328125, -26.248046875, -24.1328125, -22.017578125, -19.90234375, -17.787109375, -15.671875, -13.556640625, -11.44140625, -9.326171875, -7.2109375, -5.095703125, -2.98046875, -0.865234375, 1.25, 3.365234375, 5.48046875, 7.595703125, 9.7109375, 11.826171875, 13.94140625, 16.056640625, 18.171875, 20.287109375, 22.40234375, 24.517578125, 26.6328125, 28.748046875, 30.86328125, 32.978515625, 35.09375, 37.208984375, 39.32421875, 41.439453125, 43.5546875, 45.669921875, 47.78515625, 49.900390625, 52.015625, 54.130859375, 56.24609375, 58.361328125, 60.4765625, 62.591796875, 64.70703125, 66.822265625, 68.9375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 17.0, 21.0, 29.0, 53.0, 77.0, 118.0, 225.0, 288.0, 487.0, 761.0, 1279.0, 1951.0, 3001.0, 4818.0, 7415.0, 11288.0, 16811.0, 24220.0, 34115.0, 46992.0, 61471.0, 76301.0, 88742.0, 98193.0, 100575.0, 97178.0, 87484.0, 74515.0, 59920.0, 46068.0, 33728.0, 23543.0, 16018.0, 10990.0, 7156.0, 4562.0, 3006.0, 1872.0, 1176.0, 814.0, 470.0, 318.0, 178.0, 99.0, 78.0, 49.0, 34.0, 22.0, 9.0, 9.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-43.53125, -42.1474609375, -40.763671875, -39.3798828125, -37.99609375, -36.6123046875, -35.228515625, -33.8447265625, -32.4609375, -31.0771484375, -29.693359375, -28.3095703125, -26.92578125, -25.5419921875, -24.158203125, -22.7744140625, -21.390625, -20.0068359375, -18.623046875, -17.2392578125, -15.85546875, -14.4716796875, -13.087890625, -11.7041015625, -10.3203125, -8.9365234375, -7.552734375, -6.1689453125, -4.78515625, -3.4013671875, -2.017578125, -0.6337890625, 0.75, 2.1337890625, 3.517578125, 4.9013671875, 6.28515625, 7.6689453125, 9.052734375, 10.4365234375, 11.8203125, 13.2041015625, 14.587890625, 15.9716796875, 17.35546875, 18.7392578125, 20.123046875, 21.5068359375, 22.890625, 24.2744140625, 25.658203125, 27.0419921875, 28.42578125, 29.8095703125, 31.193359375, 32.5771484375, 33.9609375, 35.3447265625, 36.728515625, 38.1123046875, 39.49609375, 40.8798828125, 42.263671875, 43.6474609375, 45.03125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 6.0, 5.0, 6.0, 12.0, 19.0, 14.0, 23.0, 25.0, 38.0, 35.0, 36.0, 49.0, 45.0, 55.0, 59.0, 54.0, 54.0, 52.0, 45.0, 49.0, 44.0, 34.0, 40.0, 45.0, 39.0, 22.0, 18.0, 14.0, 16.0, 9.0, 11.0, 5.0, 4.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.71875, -50.111328125, -48.50390625, -46.896484375, -45.2890625, -43.681640625, -42.07421875, -40.466796875, -38.859375, -37.251953125, -35.64453125, -34.037109375, -32.4296875, -30.822265625, -29.21484375, -27.607421875, -26.0, -24.392578125, -22.78515625, -21.177734375, -19.5703125, -17.962890625, -16.35546875, -14.748046875, -13.140625, -11.533203125, -9.92578125, -8.318359375, -6.7109375, -5.103515625, -3.49609375, -1.888671875, -0.28125, 1.326171875, 2.93359375, 4.541015625, 6.1484375, 7.755859375, 9.36328125, 10.970703125, 12.578125, 14.185546875, 15.79296875, 17.400390625, 19.0078125, 20.615234375, 22.22265625, 23.830078125, 25.4375, 27.044921875, 28.65234375, 30.259765625, 31.8671875, 33.474609375, 35.08203125, 36.689453125, 38.296875, 39.904296875, 41.51171875, 43.119140625, 44.7265625, 46.333984375, 47.94140625, 49.548828125, 51.15625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 8.0, 14.0, 22.0, 38.0, 58.0, 85.0, 132.0, 235.0, 315.0, 513.0, 913.0, 1517.0, 2534.0, 4281.0, 6962.0, 11518.0, 18253.0, 28655.0, 43167.0, 62105.0, 83495.0, 103356.0, 118686.0, 122406.0, 113826.0, 96462.0, 74870.0, 53835.0, 36811.0, 24170.0, 15287.0, 9507.0, 5800.0, 3416.0, 2143.0, 1209.0, 730.0, 462.0, 278.0, 179.0, 109.0, 67.0, 41.0, 28.0, 21.0, 13.0, 9.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.15869140625, -18.5048828125, -17.85107421875, -17.197265625, -16.54345703125, -15.8896484375, -15.23583984375, -14.58203125, -13.92822265625, -13.2744140625, -12.62060546875, -11.966796875, -11.31298828125, -10.6591796875, -10.00537109375, -9.3515625, -8.69775390625, -8.0439453125, -7.39013671875, -6.736328125, -6.08251953125, -5.4287109375, -4.77490234375, -4.12109375, -3.46728515625, -2.8134765625, -2.15966796875, -1.505859375, -0.85205078125, -0.1982421875, 0.45556640625, 1.109375, 1.76318359375, 2.4169921875, 3.07080078125, 3.724609375, 4.37841796875, 5.0322265625, 5.68603515625, 6.33984375, 6.99365234375, 7.6474609375, 8.30126953125, 8.955078125, 9.60888671875, 10.2626953125, 10.91650390625, 11.5703125, 12.22412109375, 12.8779296875, 13.53173828125, 14.185546875, 14.83935546875, 15.4931640625, 16.14697265625, 16.80078125, 17.45458984375, 18.1083984375, 18.76220703125, 19.416015625, 20.06982421875, 20.7236328125, 21.37744140625, 22.03125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 10.0, 5.0, 15.0, 14.0, 11.0, 18.0, 24.0, 28.0, 26.0, 32.0, 33.0, 38.0, 45.0, 46.0, 48.0, 53.0, 48.0, 47.0, 47.0, 39.0, 43.0, 50.0, 37.0, 36.0, 20.0, 31.0, 23.0, 22.0, 20.0, 9.0, 11.0, 10.0, 8.0, 5.0, 6.0, 8.0, 6.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.002513885498046875, -0.002439558506011963, -0.0023652315139770508, -0.0022909045219421387, -0.0022165775299072266, -0.0021422505378723145, -0.0020679235458374023, -0.0019935965538024902, -0.0019192695617675781, -0.001844942569732666, -0.001770615577697754, -0.0016962885856628418, -0.0016219615936279297, -0.0015476346015930176, -0.0014733076095581055, -0.0013989806175231934, -0.0013246536254882812, -0.0012503266334533691, -0.001175999641418457, -0.001101672649383545, -0.0010273456573486328, -0.0009530186653137207, -0.0008786916732788086, -0.0008043646812438965, -0.0007300376892089844, -0.0006557106971740723, -0.0005813837051391602, -0.000507056713104248, -0.00043272972106933594, -0.00035840272903442383, -0.0002840757369995117, -0.0002097487449645996, -0.0001354217529296875, -6.109476089477539e-05, 1.3232231140136719e-05, 8.755922317504883e-05, 0.00016188621520996094, 0.00023621320724487305, 0.00031054019927978516, 0.00038486719131469727, 0.0004591941833496094, 0.0005335211753845215, 0.0006078481674194336, 0.0006821751594543457, 0.0007565021514892578, 0.0008308291435241699, 0.000905156135559082, 0.0009794831275939941, 0.0010538101196289062, 0.0011281371116638184, 0.0012024641036987305, 0.0012767910957336426, 0.0013511180877685547, 0.0014254450798034668, 0.001499772071838379, 0.001574099063873291, 0.0016484260559082031, 0.0017227530479431152, 0.0017970800399780273, 0.0018714070320129395, 0.0019457340240478516, 0.0020200610160827637, 0.0020943880081176758, 0.002168715000152588, 0.0022430419921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 10.0, 12.0, 30.0, 42.0, 66.0, 78.0, 140.0, 184.0, 326.0, 497.0, 731.0, 1142.0, 1761.0, 2695.0, 4207.0, 6469.0, 9805.0, 14688.0, 21966.0, 32010.0, 44478.0, 60519.0, 77594.0, 93598.0, 104777.0, 108160.0, 103839.0, 91634.0, 74998.0, 58021.0, 42679.0, 30336.0, 20854.0, 14099.0, 8991.0, 5948.0, 3856.0, 2576.0, 1673.0, 1083.0, 725.0, 426.0, 284.0, 183.0, 115.0, 88.0, 61.0, 28.0, 24.0, 11.0, 15.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-19.265625, -18.652587890625, -18.03955078125, -17.426513671875, -16.8134765625, -16.200439453125, -15.58740234375, -14.974365234375, -14.361328125, -13.748291015625, -13.13525390625, -12.522216796875, -11.9091796875, -11.296142578125, -10.68310546875, -10.070068359375, -9.45703125, -8.843994140625, -8.23095703125, -7.617919921875, -7.0048828125, -6.391845703125, -5.77880859375, -5.165771484375, -4.552734375, -3.939697265625, -3.32666015625, -2.713623046875, -2.1005859375, -1.487548828125, -0.87451171875, -0.261474609375, 0.3515625, 0.964599609375, 1.57763671875, 2.190673828125, 2.8037109375, 3.416748046875, 4.02978515625, 4.642822265625, 5.255859375, 5.868896484375, 6.48193359375, 7.094970703125, 7.7080078125, 8.321044921875, 8.93408203125, 9.547119140625, 10.16015625, 10.773193359375, 11.38623046875, 11.999267578125, 12.6123046875, 13.225341796875, 13.83837890625, 14.451416015625, 15.064453125, 15.677490234375, 16.29052734375, 16.903564453125, 17.5166015625, 18.129638671875, 18.74267578125, 19.355712890625, 19.96875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 2.0, 14.0, 12.0, 4.0, 17.0, 28.0, 26.0, 20.0, 24.0, 37.0, 47.0, 45.0, 42.0, 53.0, 50.0, 54.0, 48.0, 43.0, 54.0, 45.0, 38.0, 41.0, 42.0, 29.0, 27.0, 25.0, 24.0, 19.0, 21.0, 11.0, 9.0, 12.0, 5.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-10.4375, -10.1297607421875, -9.822021484375, -9.5142822265625, -9.20654296875, -8.8988037109375, -8.591064453125, -8.2833251953125, -7.9755859375, -7.6678466796875, -7.360107421875, -7.0523681640625, -6.74462890625, -6.4368896484375, -6.129150390625, -5.8214111328125, -5.513671875, -5.2059326171875, -4.898193359375, -4.5904541015625, -4.28271484375, -3.9749755859375, -3.667236328125, -3.3594970703125, -3.0517578125, -2.7440185546875, -2.436279296875, -2.1285400390625, -1.82080078125, -1.5130615234375, -1.205322265625, -0.8975830078125, -0.58984375, -0.2821044921875, 0.025634765625, 0.3333740234375, 0.64111328125, 0.9488525390625, 1.256591796875, 1.5643310546875, 1.8720703125, 2.1798095703125, 2.487548828125, 2.7952880859375, 3.10302734375, 3.4107666015625, 3.718505859375, 4.0262451171875, 4.333984375, 4.6417236328125, 4.949462890625, 5.2572021484375, 5.56494140625, 5.8726806640625, 6.180419921875, 6.4881591796875, 6.7958984375, 7.1036376953125, 7.411376953125, 7.7191162109375, 8.02685546875, 8.3345947265625, 8.642333984375, 8.9500732421875, 9.2578125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 6.0, 6.0, 7.0, 11.0, 13.0, 18.0, 10.0, 22.0, 17.0, 22.0, 24.0, 24.0, 26.0, 24.0, 32.0, 29.0, 33.0, 30.0, 34.0, 45.0, 39.0, 37.0, 33.0, 41.0, 29.0, 41.0, 35.0, 30.0, 32.0, 28.0, 22.0, 19.0, 14.0, 25.0, 15.0, 18.0, 13.0, 16.0, 11.0, 20.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.57626724243164, -46.00093078613281, -44.425594329833984, -42.850257873535156, -41.274925231933594, -39.699588775634766, -38.12425231933594, -36.54891586303711, -34.97357940673828, -33.39824295043945, -31.822908401489258, -30.24757194519043, -28.6722354888916, -27.096900939941406, -25.521564483642578, -23.94622802734375, -22.370893478393555, -20.795557022094727, -19.22022247314453, -17.644886016845703, -16.069549560546875, -14.494214057922363, -12.918878555297852, -11.343542098999023, -9.768206596374512, -8.19287109375, -6.617534637451172, -5.04219913482666, -3.4668631553649902, -1.8915271759033203, -0.3161916732788086, 1.2591447830200195, 2.8344802856445312, 4.409816265106201, 5.985152244567871, 7.560487747192383, 9.135824203491211, 10.711159706115723, 12.286495208740234, 13.861831665039062, 15.437167167663574, 17.012502670288086, 18.587839126586914, 20.16317367553711, 21.738510131835938, 23.313846588134766, 24.889183044433594, 26.464519500732422, 28.039854049682617, 29.615190505981445, 31.19052505493164, 32.76586151123047, 34.3411979675293, 35.916534423828125, 37.49186706542969, 39.06720733642578, 40.642539978027344, 42.21787643432617, 43.793212890625, 45.36854553222656, 46.94388198852539, 48.51921844482422, 50.09455490112305, 51.669891357421875, 53.2452278137207]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 10.0, 14.0, 10.0, 18.0, 14.0, 16.0, 34.0, 18.0, 31.0, 32.0, 37.0, 30.0, 41.0, 38.0, 44.0, 37.0, 34.0, 56.0, 47.0, 50.0, 33.0, 41.0, 41.0, 37.0, 37.0, 24.0, 25.0, 20.0, 18.0, 15.0, 16.0, 9.0, 11.0, 8.0, 9.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.180599212646484, -61.082515716552734, -58.984432220458984, -56.8863525390625, -54.78826904296875, -52.690185546875, -50.59210205078125, -48.4940185546875, -46.39593505859375, -44.2978515625, -42.19976806640625, -40.1016845703125, -38.003604888916016, -35.905521392822266, -33.807437896728516, -31.709354400634766, -29.61127471923828, -27.51319122314453, -25.415109634399414, -23.317026138305664, -21.218944549560547, -19.120861053466797, -17.022777557373047, -14.924695014953613, -12.82661247253418, -10.728529930114746, -8.630447387695312, -6.5323638916015625, -4.434281349182129, -2.3361988067626953, -0.2381153106689453, 1.8599672317504883, 3.9580459594726562, 6.05612850189209, 8.154211044311523, 10.252294540405273, 12.350377082824707, 14.44845962524414, 16.54654312133789, 18.64462661743164, 20.742708206176758, 22.840791702270508, 24.938873291015625, 27.036956787109375, 29.135040283203125, 31.233121871948242, 33.331207275390625, 35.42928695678711, 37.52737045288086, 39.62545394897461, 41.72353744506836, 43.821617126464844, 45.919700622558594, 48.017784118652344, 50.115867614746094, 52.213951110839844, 54.312034606933594, 56.410118103027344, 58.508201599121094, 60.606285095214844, 62.70436477661133, 64.80244445800781, 66.90052795410156, 68.99861145019531, 71.09669494628906]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 21.0, 38.0, 60.0, 101.0, 162.0, 283.0, 471.0, 759.0, 1238.0, 2002.0, 3271.0, 5274.0, 8580.0, 13781.0, 21449.0, 33350.0, 50604.0, 75652.0, 111510.0, 158367.0, 216735.0, 281654.0, 346194.0, 398288.0, 424198.0, 419881.0, 385390.0, 328748.0, 263344.0, 199960.0, 144467.0, 101911.0, 68613.0, 45374.0, 30139.0, 19355.0, 12284.0, 7931.0, 4881.0, 3061.0, 1855.0, 1169.0, 733.0, 429.0, 265.0, 168.0, 96.0, 67.0, 42.0, 28.0, 12.0, 11.0, 8.0, 5.0, 3.0, 0.0, 3.0], "bins": [-43.1875, -41.83251953125, -40.4775390625, -39.12255859375, -37.767578125, -36.41259765625, -35.0576171875, -33.70263671875, -32.34765625, -30.99267578125, -29.6376953125, -28.28271484375, -26.927734375, -25.57275390625, -24.2177734375, -22.86279296875, -21.5078125, -20.15283203125, -18.7978515625, -17.44287109375, -16.087890625, -14.73291015625, -13.3779296875, -12.02294921875, -10.66796875, -9.31298828125, -7.9580078125, -6.60302734375, -5.248046875, -3.89306640625, -2.5380859375, -1.18310546875, 0.171875, 1.52685546875, 2.8818359375, 4.23681640625, 5.591796875, 6.94677734375, 8.3017578125, 9.65673828125, 11.01171875, 12.36669921875, 13.7216796875, 15.07666015625, 16.431640625, 17.78662109375, 19.1416015625, 20.49658203125, 21.8515625, 23.20654296875, 24.5615234375, 25.91650390625, 27.271484375, 28.62646484375, 29.9814453125, 31.33642578125, 32.69140625, 34.04638671875, 35.4013671875, 36.75634765625, 38.111328125, 39.46630859375, 40.8212890625, 42.17626953125, 43.53125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 11.0, 6.0, 6.0, 11.0, 13.0, 11.0, 18.0, 13.0, 22.0, 30.0, 25.0, 35.0, 29.0, 30.0, 31.0, 47.0, 38.0, 38.0, 31.0, 45.0, 52.0, 45.0, 48.0, 40.0, 43.0, 33.0, 37.0, 33.0, 27.0, 21.0, 18.0, 19.0, 19.0, 13.0, 11.0, 6.0, 9.0, 8.0, 5.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-56.0, -54.1796875, -52.359375, -50.5390625, -48.71875, -46.8984375, -45.078125, -43.2578125, -41.4375, -39.6171875, -37.796875, -35.9765625, -34.15625, -32.3359375, -30.515625, -28.6953125, -26.875, -25.0546875, -23.234375, -21.4140625, -19.59375, -17.7734375, -15.953125, -14.1328125, -12.3125, -10.4921875, -8.671875, -6.8515625, -5.03125, -3.2109375, -1.390625, 0.4296875, 2.25, 4.0703125, 5.890625, 7.7109375, 9.53125, 11.3515625, 13.171875, 14.9921875, 16.8125, 18.6328125, 20.453125, 22.2734375, 24.09375, 25.9140625, 27.734375, 29.5546875, 31.375, 33.1953125, 35.015625, 36.8359375, 38.65625, 40.4765625, 42.296875, 44.1171875, 45.9375, 47.7578125, 49.578125, 51.3984375, 53.21875, 55.0390625, 56.859375, 58.6796875, 60.5]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 12.0, 27.0, 33.0, 53.0, 102.0, 169.0, 323.0, 490.0, 890.0, 1513.0, 2478.0, 4184.0, 6783.0, 11356.0, 18283.0, 28719.0, 44732.0, 66945.0, 97496.0, 139459.0, 190665.0, 248387.0, 307323.0, 359410.0, 395469.0, 406839.0, 390484.0, 354055.0, 297747.0, 238975.0, 181915.0, 132655.0, 92836.0, 62686.0, 41319.0, 26673.0, 16537.0, 10394.0, 6355.0, 3792.0, 2358.0, 1380.0, 840.0, 486.0, 270.0, 167.0, 79.0, 71.0, 32.0, 18.0, 10.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.9375, -42.4931640625, -41.048828125, -39.6044921875, -38.16015625, -36.7158203125, -35.271484375, -33.8271484375, -32.3828125, -30.9384765625, -29.494140625, -28.0498046875, -26.60546875, -25.1611328125, -23.716796875, -22.2724609375, -20.828125, -19.3837890625, -17.939453125, -16.4951171875, -15.05078125, -13.6064453125, -12.162109375, -10.7177734375, -9.2734375, -7.8291015625, -6.384765625, -4.9404296875, -3.49609375, -2.0517578125, -0.607421875, 0.8369140625, 2.28125, 3.7255859375, 5.169921875, 6.6142578125, 8.05859375, 9.5029296875, 10.947265625, 12.3916015625, 13.8359375, 15.2802734375, 16.724609375, 18.1689453125, 19.61328125, 21.0576171875, 22.501953125, 23.9462890625, 25.390625, 26.8349609375, 28.279296875, 29.7236328125, 31.16796875, 32.6123046875, 34.056640625, 35.5009765625, 36.9453125, 38.3896484375, 39.833984375, 41.2783203125, 42.72265625, 44.1669921875, 45.611328125, 47.0556640625, 48.5]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 6.0, 14.0, 20.0, 18.0, 35.0, 29.0, 54.0, 55.0, 95.0, 90.0, 120.0, 142.0, 150.0, 163.0, 201.0, 207.0, 246.0, 215.0, 253.0, 220.0, 253.0, 204.0, 203.0, 176.0, 169.0, 151.0, 109.0, 111.0, 89.0, 66.0, 58.0, 38.0, 36.0, 22.0, 11.0, 11.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.890625, -28.948974609375, -28.00732421875, -27.065673828125, -26.1240234375, -25.182373046875, -24.24072265625, -23.299072265625, -22.357421875, -21.415771484375, -20.47412109375, -19.532470703125, -18.5908203125, -17.649169921875, -16.70751953125, -15.765869140625, -14.82421875, -13.882568359375, -12.94091796875, -11.999267578125, -11.0576171875, -10.115966796875, -9.17431640625, -8.232666015625, -7.291015625, -6.349365234375, -5.40771484375, -4.466064453125, -3.5244140625, -2.582763671875, -1.64111328125, -0.699462890625, 0.2421875, 1.183837890625, 2.12548828125, 3.067138671875, 4.0087890625, 4.950439453125, 5.89208984375, 6.833740234375, 7.775390625, 8.717041015625, 9.65869140625, 10.600341796875, 11.5419921875, 12.483642578125, 13.42529296875, 14.366943359375, 15.30859375, 16.250244140625, 17.19189453125, 18.133544921875, 19.0751953125, 20.016845703125, 20.95849609375, 21.900146484375, 22.841796875, 23.783447265625, 24.72509765625, 25.666748046875, 26.6083984375, 27.550048828125, 28.49169921875, 29.433349609375, 30.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 8.0, 7.0, 7.0, 16.0, 9.0, 12.0, 23.0, 21.0, 26.0, 23.0, 24.0, 30.0, 44.0, 38.0, 42.0, 41.0, 38.0, 41.0, 36.0, 45.0, 33.0, 36.0, 40.0, 41.0, 28.0, 27.0, 29.0, 24.0, 33.0, 28.0, 16.0, 10.0, 15.0, 21.0, 15.0, 14.0, 9.0, 5.0, 7.0, 6.0, 3.0, 8.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.45366668701172, -50.6524772644043, -48.85129165649414, -47.05010223388672, -45.2489128112793, -43.447723388671875, -41.64653778076172, -39.8453483581543, -38.044158935546875, -36.24296951293945, -34.4417839050293, -32.640594482421875, -30.839405059814453, -29.038217544555664, -27.237030029296875, -25.435840606689453, -23.634653091430664, -21.833465576171875, -20.032276153564453, -18.231088638305664, -16.429899215698242, -14.628711700439453, -12.827523231506348, -11.026334762573242, -9.225146293640137, -7.423957824707031, -5.622769355773926, -3.8215813636779785, -2.020392894744873, -0.21920490264892578, 1.5819835662841797, 3.383172035217285, 5.184360504150391, 6.985548973083496, 8.786737442016602, 10.58792495727539, 12.389114379882812, 14.190301895141602, 15.991490364074707, 17.792678833007812, 19.593868255615234, 21.395055770874023, 23.196245193481445, 24.997432708740234, 26.798622131347656, 28.599809646606445, 30.400997161865234, 32.202186584472656, 34.00337219238281, 35.804561614990234, 37.60574722290039, 39.40693664550781, 41.208126068115234, 43.009315490722656, 44.81050109863281, 46.611690521240234, 48.412879943847656, 50.21406936645508, 52.015254974365234, 53.816444396972656, 55.61763381958008, 57.4188232421875, 59.220008850097656, 61.02119827270508, 62.8223876953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 9.0, 7.0, 11.0, 12.0, 12.0, 19.0, 18.0, 19.0, 16.0, 23.0, 33.0, 36.0, 30.0, 36.0, 27.0, 40.0, 47.0, 36.0, 43.0, 28.0, 33.0, 48.0, 46.0, 33.0, 38.0, 43.0, 28.0, 31.0, 31.0, 23.0, 26.0, 15.0, 13.0, 13.0, 13.0, 9.0, 11.0, 8.0, 5.0, 9.0, 1.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-59.35512924194336, -57.40300750732422, -55.45088195800781, -53.49876022338867, -51.54663848876953, -49.594512939453125, -47.642391204833984, -45.690269470214844, -43.73814392089844, -41.7860221862793, -39.83389663696289, -37.88177490234375, -35.92965316772461, -33.97753143310547, -32.02540588378906, -30.073284149169922, -28.12116241455078, -26.169038772583008, -24.216917037963867, -22.264793395996094, -20.312671661376953, -18.36054801940918, -16.408424377441406, -14.45630168914795, -12.504179000854492, -10.552056312561035, -8.599933624267578, -6.647809982299805, -4.695687294006348, -2.7435646057128906, -0.7914409637451172, 1.1606817245483398, 3.1128082275390625, 5.0649309158325195, 7.017054080963135, 8.96917724609375, 10.921299934387207, 12.873422622680664, 14.825546264648438, 16.777667999267578, 18.72979164123535, 20.681915283203125, 22.634037017822266, 24.58616065979004, 26.538284301757812, 28.490406036376953, 30.442529678344727, 32.3946533203125, 34.34677505493164, 36.29889678955078, 38.25102233886719, 40.20314407348633, 42.15526580810547, 44.107391357421875, 46.059513092041016, 48.011634826660156, 49.96376037597656, 51.9158821105957, 53.86800765991211, 55.82012939453125, 57.77225112915039, 59.72437286376953, 61.67649841308594, 63.62862014770508, 65.58074188232422]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 3.0, 14.0, 17.0, 34.0, 60.0, 80.0, 124.0, 213.0, 316.0, 551.0, 890.0, 1403.0, 2415.0, 3822.0, 6190.0, 10068.0, 15631.0, 24099.0, 36110.0, 52881.0, 73214.0, 95966.0, 115330.0, 124420.0, 119704.0, 103653.0, 81756.0, 59845.0, 41990.0, 28283.0, 18457.0, 11608.0, 7405.0, 4586.0, 2902.0, 1713.0, 1056.0, 696.0, 404.0, 228.0, 166.0, 79.0, 68.0, 36.0, 27.0, 20.0, 7.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.15625, -13.70947265625, -13.2626953125, -12.81591796875, -12.369140625, -11.92236328125, -11.4755859375, -11.02880859375, -10.58203125, -10.13525390625, -9.6884765625, -9.24169921875, -8.794921875, -8.34814453125, -7.9013671875, -7.45458984375, -7.0078125, -6.56103515625, -6.1142578125, -5.66748046875, -5.220703125, -4.77392578125, -4.3271484375, -3.88037109375, -3.43359375, -2.98681640625, -2.5400390625, -2.09326171875, -1.646484375, -1.19970703125, -0.7529296875, -0.30615234375, 0.140625, 0.58740234375, 1.0341796875, 1.48095703125, 1.927734375, 2.37451171875, 2.8212890625, 3.26806640625, 3.71484375, 4.16162109375, 4.6083984375, 5.05517578125, 5.501953125, 5.94873046875, 6.3955078125, 6.84228515625, 7.2890625, 7.73583984375, 8.1826171875, 8.62939453125, 9.076171875, 9.52294921875, 9.9697265625, 10.41650390625, 10.86328125, 11.31005859375, 11.7568359375, 12.20361328125, 12.650390625, 13.09716796875, 13.5439453125, 13.99072265625, 14.4375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 11.0, 10.0, 13.0, 18.0, 19.0, 20.0, 17.0, 18.0, 39.0, 35.0, 30.0, 35.0, 28.0, 39.0, 47.0, 40.0, 38.0, 29.0, 35.0, 48.0, 45.0, 39.0, 31.0, 44.0, 30.0, 31.0, 29.0, 26.0, 22.0, 18.0, 12.0, 14.0, 11.0, 10.0, 11.0, 8.0, 3.0, 9.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-59.65625, -57.69384765625, -55.7314453125, -53.76904296875, -51.806640625, -49.84423828125, -47.8818359375, -45.91943359375, -43.95703125, -41.99462890625, -40.0322265625, -38.06982421875, -36.107421875, -34.14501953125, -32.1826171875, -30.22021484375, -28.2578125, -26.29541015625, -24.3330078125, -22.37060546875, -20.408203125, -18.44580078125, -16.4833984375, -14.52099609375, -12.55859375, -10.59619140625, -8.6337890625, -6.67138671875, -4.708984375, -2.74658203125, -0.7841796875, 1.17822265625, 3.140625, 5.10302734375, 7.0654296875, 9.02783203125, 10.990234375, 12.95263671875, 14.9150390625, 16.87744140625, 18.83984375, 20.80224609375, 22.7646484375, 24.72705078125, 26.689453125, 28.65185546875, 30.6142578125, 32.57666015625, 34.5390625, 36.50146484375, 38.4638671875, 40.42626953125, 42.388671875, 44.35107421875, 46.3134765625, 48.27587890625, 50.23828125, 52.20068359375, 54.1630859375, 56.12548828125, 58.087890625, 60.05029296875, 62.0126953125, 63.97509765625, 65.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 4.0, 5.0, 4.0, 3.0, 11.0, 7.0, 14.0, 24.0, 20.0, 39.0, 59.0, 87.0, 108.0, 163.0, 240.0, 439.0, 639.0, 1174.0, 1999.0, 3646.0, 6865.0, 13202.0, 26368.0, 129229.0, 792977.0, 35183.0, 16627.0, 8642.0, 4587.0, 2511.0, 1422.0, 845.0, 502.0, 306.0, 185.0, 131.0, 81.0, 50.0, 46.0, 31.0, 27.0, 16.0, 7.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-60.625, -58.7412109375, -56.857421875, -54.9736328125, -53.08984375, -51.2060546875, -49.322265625, -47.4384765625, -45.5546875, -43.6708984375, -41.787109375, -39.9033203125, -38.01953125, -36.1357421875, -34.251953125, -32.3681640625, -30.484375, -28.6005859375, -26.716796875, -24.8330078125, -22.94921875, -21.0654296875, -19.181640625, -17.2978515625, -15.4140625, -13.5302734375, -11.646484375, -9.7626953125, -7.87890625, -5.9951171875, -4.111328125, -2.2275390625, -0.34375, 1.5400390625, 3.423828125, 5.3076171875, 7.19140625, 9.0751953125, 10.958984375, 12.8427734375, 14.7265625, 16.6103515625, 18.494140625, 20.3779296875, 22.26171875, 24.1455078125, 26.029296875, 27.9130859375, 29.796875, 31.6806640625, 33.564453125, 35.4482421875, 37.33203125, 39.2158203125, 41.099609375, 42.9833984375, 44.8671875, 46.7509765625, 48.634765625, 50.5185546875, 52.40234375, 54.2861328125, 56.169921875, 58.0537109375, 59.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 9.0, 6.0, 12.0, 8.0, 12.0, 10.0, 9.0, 14.0, 21.0, 21.0, 30.0, 26.0, 38.0, 43.0, 35.0, 37.0, 32.0, 52.0, 44.0, 42.0, 45.0, 40.0, 45.0, 48.0, 34.0, 34.0, 31.0, 35.0, 18.0, 28.0, 18.0, 20.0, 15.0, 15.0, 17.0, 9.0, 11.0, 5.0, 6.0, 6.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.25, -42.8720703125, -41.494140625, -40.1162109375, -38.73828125, -37.3603515625, -35.982421875, -34.6044921875, -33.2265625, -31.8486328125, -30.470703125, -29.0927734375, -27.71484375, -26.3369140625, -24.958984375, -23.5810546875, -22.203125, -20.8251953125, -19.447265625, -18.0693359375, -16.69140625, -15.3134765625, -13.935546875, -12.5576171875, -11.1796875, -9.8017578125, -8.423828125, -7.0458984375, -5.66796875, -4.2900390625, -2.912109375, -1.5341796875, -0.15625, 1.2216796875, 2.599609375, 3.9775390625, 5.35546875, 6.7333984375, 8.111328125, 9.4892578125, 10.8671875, 12.2451171875, 13.623046875, 15.0009765625, 16.37890625, 17.7568359375, 19.134765625, 20.5126953125, 21.890625, 23.2685546875, 24.646484375, 26.0244140625, 27.40234375, 28.7802734375, 30.158203125, 31.5361328125, 32.9140625, 34.2919921875, 35.669921875, 37.0478515625, 38.42578125, 39.8037109375, 41.181640625, 42.5595703125, 43.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 7.0, 2.0, 16.0, 13.0, 19.0, 28.0, 33.0, 48.0, 77.0, 89.0, 155.0, 211.0, 281.0, 489.0, 751.0, 1220.0, 2022.0, 3565.0, 5928.0, 10030.0, 18880.0, 38460.0, 779718.0, 126165.0, 26697.0, 14171.0, 7758.0, 4594.0, 2651.0, 1598.0, 953.0, 608.0, 423.0, 267.0, 174.0, 132.0, 93.0, 66.0, 36.0, 34.0, 25.0, 17.0, 16.0, 11.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.078125, -2.981231689453125, -2.88433837890625, -2.787445068359375, -2.6905517578125, -2.593658447265625, -2.49676513671875, -2.399871826171875, -2.302978515625, -2.206085205078125, -2.10919189453125, -2.012298583984375, -1.9154052734375, -1.818511962890625, -1.72161865234375, -1.624725341796875, -1.52783203125, -1.430938720703125, -1.33404541015625, -1.237152099609375, -1.1402587890625, -1.043365478515625, -0.94647216796875, -0.849578857421875, -0.752685546875, -0.655792236328125, -0.55889892578125, -0.462005615234375, -0.3651123046875, -0.268218994140625, -0.17132568359375, -0.074432373046875, 0.0224609375, 0.119354248046875, 0.21624755859375, 0.313140869140625, 0.4100341796875, 0.506927490234375, 0.60382080078125, 0.700714111328125, 0.797607421875, 0.894500732421875, 0.99139404296875, 1.088287353515625, 1.1851806640625, 1.282073974609375, 1.37896728515625, 1.475860595703125, 1.57275390625, 1.669647216796875, 1.76654052734375, 1.863433837890625, 1.9603271484375, 2.057220458984375, 2.15411376953125, 2.251007080078125, 2.347900390625, 2.444793701171875, 2.54168701171875, 2.638580322265625, 2.7354736328125, 2.832366943359375, 2.92926025390625, 3.026153564453125, 3.123046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 6.0, 11.0, 13.0, 12.0, 15.0, 21.0, 24.0, 40.0, 51.0, 60.0, 60.0, 76.0, 69.0, 48.0, 80.0, 82.0, 57.0, 52.0, 42.0, 32.0, 31.0, 22.0, 10.0, 19.0, 10.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001575946807861328, -0.0001520290970802307, -0.0001464635133743286, -0.00014089792966842651, -0.00013533234596252441, -0.00012976676225662231, -0.00012420117855072021, -0.00011863559484481812, -0.00011307001113891602, -0.00010750442743301392, -0.00010193884372711182, -9.637326002120972e-05, -9.080767631530762e-05, -8.524209260940552e-05, -7.967650890350342e-05, -7.411092519760132e-05, -6.854534149169922e-05, -6.297975778579712e-05, -5.741417407989502e-05, -5.184859037399292e-05, -4.628300666809082e-05, -4.071742296218872e-05, -3.515183925628662e-05, -2.958625555038452e-05, -2.4020671844482422e-05, -1.8455088138580322e-05, -1.2889504432678223e-05, -7.323920726776123e-06, -1.7583370208740234e-06, 3.807246685028076e-06, 9.372830390930176e-06, 1.4938414096832275e-05, 2.0503997802734375e-05, 2.6069581508636475e-05, 3.1635165214538574e-05, 3.7200748920440674e-05, 4.2766332626342773e-05, 4.833191633224487e-05, 5.389750003814697e-05, 5.946308374404907e-05, 6.502866744995117e-05, 7.059425115585327e-05, 7.615983486175537e-05, 8.172541856765747e-05, 8.729100227355957e-05, 9.285658597946167e-05, 9.842216968536377e-05, 0.00010398775339126587, 0.00010955333709716797, 0.00011511892080307007, 0.00012068450450897217, 0.00012625008821487427, 0.00013181567192077637, 0.00013738125562667847, 0.00014294683933258057, 0.00014851242303848267, 0.00015407800674438477, 0.00015964359045028687, 0.00016520917415618896, 0.00017077475786209106, 0.00017634034156799316, 0.00018190592527389526, 0.00018747150897979736, 0.00019303709268569946, 0.00019860267639160156]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 8.0, 8.0, 18.0, 17.0, 34.0, 59.0, 85.0, 115.0, 218.0, 352.0, 536.0, 769.0, 1219.0, 1936.0, 3008.0, 4623.0, 7230.0, 11011.0, 16365.0, 23813.0, 34252.0, 48244.0, 64622.0, 82775.0, 100291.0, 112705.0, 113801.0, 103428.0, 86222.0, 67624.0, 50612.0, 36157.0, 25641.0, 17367.0, 11588.0, 7730.0, 5008.0, 3168.0, 2147.0, 1326.0, 848.0, 578.0, 381.0, 224.0, 153.0, 82.0, 58.0, 41.0, 30.0, 14.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.025390625, -1.95574951171875, -1.8861083984375, -1.81646728515625, -1.746826171875, -1.67718505859375, -1.6075439453125, -1.53790283203125, -1.46826171875, -1.39862060546875, -1.3289794921875, -1.25933837890625, -1.189697265625, -1.12005615234375, -1.0504150390625, -0.98077392578125, -0.9111328125, -0.84149169921875, -0.7718505859375, -0.70220947265625, -0.632568359375, -0.56292724609375, -0.4932861328125, -0.42364501953125, -0.35400390625, -0.28436279296875, -0.2147216796875, -0.14508056640625, -0.075439453125, -0.00579833984375, 0.0638427734375, 0.13348388671875, 0.203125, 0.27276611328125, 0.3424072265625, 0.41204833984375, 0.481689453125, 0.55133056640625, 0.6209716796875, 0.69061279296875, 0.76025390625, 0.82989501953125, 0.8995361328125, 0.96917724609375, 1.038818359375, 1.10845947265625, 1.1781005859375, 1.24774169921875, 1.3173828125, 1.38702392578125, 1.4566650390625, 1.52630615234375, 1.595947265625, 1.66558837890625, 1.7352294921875, 1.80487060546875, 1.87451171875, 1.94415283203125, 2.0137939453125, 2.08343505859375, 2.153076171875, 2.22271728515625, 2.2923583984375, 2.36199951171875, 2.431640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 9.0, 9.0, 14.0, 17.0, 19.0, 10.0, 21.0, 29.0, 28.0, 32.0, 40.0, 35.0, 52.0, 36.0, 37.0, 52.0, 46.0, 50.0, 45.0, 42.0, 42.0, 43.0, 53.0, 38.0, 30.0, 22.0, 18.0, 20.0, 27.0, 13.0, 19.0, 10.0, 5.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.103515625, -1.070770263671875, -1.03802490234375, -1.005279541015625, -0.9725341796875, -0.939788818359375, -0.90704345703125, -0.874298095703125, -0.841552734375, -0.808807373046875, -0.77606201171875, -0.743316650390625, -0.7105712890625, -0.677825927734375, -0.64508056640625, -0.612335205078125, -0.57958984375, -0.546844482421875, -0.51409912109375, -0.481353759765625, -0.4486083984375, -0.415863037109375, -0.38311767578125, -0.350372314453125, -0.317626953125, -0.284881591796875, -0.25213623046875, -0.219390869140625, -0.1866455078125, -0.153900146484375, -0.12115478515625, -0.088409423828125, -0.0556640625, -0.022918701171875, 0.00982666015625, 0.042572021484375, 0.0753173828125, 0.108062744140625, 0.14080810546875, 0.173553466796875, 0.206298828125, 0.239044189453125, 0.27178955078125, 0.304534912109375, 0.3372802734375, 0.370025634765625, 0.40277099609375, 0.435516357421875, 0.46826171875, 0.501007080078125, 0.53375244140625, 0.566497802734375, 0.5992431640625, 0.631988525390625, 0.66473388671875, 0.697479248046875, 0.730224609375, 0.762969970703125, 0.79571533203125, 0.828460693359375, 0.8612060546875, 0.893951416015625, 0.92669677734375, 0.959442138671875, 0.9921875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 4.0, 9.0, 11.0, 9.0, 13.0, 21.0, 16.0, 15.0, 19.0, 27.0, 26.0, 34.0, 36.0, 38.0, 41.0, 47.0, 31.0, 36.0, 53.0, 29.0, 40.0, 39.0, 42.0, 30.0, 29.0, 28.0, 30.0, 35.0, 26.0, 27.0, 17.0, 8.0, 19.0, 17.0, 19.0, 10.0, 10.0, 5.0, 10.0, 3.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.127662658691406, -53.357574462890625, -51.587486267089844, -49.81739807128906, -48.047306060791016, -46.277217864990234, -44.50712966918945, -42.73704147338867, -40.966949462890625, -39.196861267089844, -37.42677307128906, -35.65668487548828, -33.886592864990234, -32.11650466918945, -30.346416473388672, -28.57632827758789, -26.80624008178711, -25.036151885986328, -23.266061782836914, -21.495973587036133, -19.72588348388672, -17.955795288085938, -16.185707092285156, -14.415617942810059, -12.645528793334961, -10.875439643859863, -9.105350494384766, -7.335262298583984, -5.565173149108887, -3.795083999633789, -2.024995803833008, -0.25490665435791016, 1.5151824951171875, 3.285271406173706, 5.055360317230225, 6.825448989868164, 8.595538139343262, 10.36562728881836, 12.13571548461914, 13.905804634094238, 15.675893783569336, 17.445981979370117, 19.21607208251953, 20.986160278320312, 22.756248474121094, 24.526338577270508, 26.29642677307129, 28.066516876220703, 29.836605072021484, 31.606693267822266, 33.37678146362305, 35.146873474121094, 36.916961669921875, 38.687049865722656, 40.45713806152344, 42.22722625732422, 43.997314453125, 45.76740264892578, 47.53749084472656, 49.307579040527344, 51.07767105102539, 52.84775924682617, 54.61784744262695, 56.387935638427734, 58.15802764892578]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 9.0, 7.0, 11.0, 9.0, 14.0, 17.0, 20.0, 18.0, 20.0, 19.0, 32.0, 40.0, 28.0, 36.0, 26.0, 42.0, 48.0, 38.0, 40.0, 28.0, 37.0, 41.0, 46.0, 41.0, 33.0, 41.0, 34.0, 33.0, 27.0, 27.0, 20.0, 17.0, 13.0, 11.0, 15.0, 11.0, 12.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-60.02375793457031, -58.05263900756836, -56.08151626586914, -54.11039733886719, -52.13927459716797, -50.168155670166016, -48.19703674316406, -46.225914001464844, -44.25479507446289, -42.28367614746094, -40.31255340576172, -38.341434478759766, -36.37031555175781, -34.399192810058594, -32.42807388305664, -30.456953048706055, -28.48583221435547, -26.514711380004883, -24.543590545654297, -22.572471618652344, -20.601350784301758, -18.630229949951172, -16.65911102294922, -14.687990188598633, -12.716869354248047, -10.745748519897461, -8.774628639221191, -6.803508281707764, -4.832387924194336, -2.86126708984375, -0.8901472091674805, 1.080972671508789, 3.052093505859375, 5.023213863372803, 6.9943342208862305, 8.9654541015625, 10.936574935913086, 12.907695770263672, 14.878815650939941, 16.84993553161621, 18.821056365966797, 20.792177200317383, 22.76329803466797, 24.734416961669922, 26.705537796020508, 28.676658630371094, 30.647777557373047, 32.618896484375, 34.59001922607422, 36.56113815307617, 38.53226089477539, 40.503379821777344, 42.47450256347656, 44.445621490478516, 46.41674041748047, 48.38786315917969, 50.35898208618164, 52.330101013183594, 54.30122375488281, 56.272342681884766, 58.24346160888672, 60.21458435058594, 62.18570327758789, 64.15682220458984, 66.12794494628906]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 6.0, 9.0, 14.0, 16.0, 36.0, 59.0, 95.0, 172.0, 276.0, 516.0, 975.0, 1753.0, 3279.0, 6053.0, 10554.0, 18216.0, 29788.0, 45599.0, 65871.0, 87032.0, 107752.0, 120799.0, 122597.0, 114046.0, 96165.0, 74650.0, 53696.0, 35700.0, 22391.0, 13522.0, 7697.0, 4174.0, 2269.0, 1205.0, 677.0, 364.0, 196.0, 119.0, 76.0, 49.0, 25.0, 22.0, 15.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.28125, -50.60595703125, -48.9306640625, -47.25537109375, -45.580078125, -43.90478515625, -42.2294921875, -40.55419921875, -38.87890625, -37.20361328125, -35.5283203125, -33.85302734375, -32.177734375, -30.50244140625, -28.8271484375, -27.15185546875, -25.4765625, -23.80126953125, -22.1259765625, -20.45068359375, -18.775390625, -17.10009765625, -15.4248046875, -13.74951171875, -12.07421875, -10.39892578125, -8.7236328125, -7.04833984375, -5.373046875, -3.69775390625, -2.0224609375, -0.34716796875, 1.328125, 3.00341796875, 4.6787109375, 6.35400390625, 8.029296875, 9.70458984375, 11.3798828125, 13.05517578125, 14.73046875, 16.40576171875, 18.0810546875, 19.75634765625, 21.431640625, 23.10693359375, 24.7822265625, 26.45751953125, 28.1328125, 29.80810546875, 31.4833984375, 33.15869140625, 34.833984375, 36.50927734375, 38.1845703125, 39.85986328125, 41.53515625, 43.21044921875, 44.8857421875, 46.56103515625, 48.236328125, 49.91162109375, 51.5869140625, 53.26220703125, 54.9375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 7.0, 8.0, 10.0, 15.0, 13.0, 26.0, 16.0, 20.0, 18.0, 36.0, 36.0, 29.0, 39.0, 23.0, 43.0, 54.0, 33.0, 38.0, 34.0, 34.0, 48.0, 43.0, 44.0, 32.0, 42.0, 27.0, 33.0, 26.0, 30.0, 21.0, 16.0, 13.0, 12.0, 11.0, 14.0, 10.0, 4.0, 5.0, 8.0, 1.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-58.4375, -56.513671875, -54.58984375, -52.666015625, -50.7421875, -48.818359375, -46.89453125, -44.970703125, -43.046875, -41.123046875, -39.19921875, -37.275390625, -35.3515625, -33.427734375, -31.50390625, -29.580078125, -27.65625, -25.732421875, -23.80859375, -21.884765625, -19.9609375, -18.037109375, -16.11328125, -14.189453125, -12.265625, -10.341796875, -8.41796875, -6.494140625, -4.5703125, -2.646484375, -0.72265625, 1.201171875, 3.125, 5.048828125, 6.97265625, 8.896484375, 10.8203125, 12.744140625, 14.66796875, 16.591796875, 18.515625, 20.439453125, 22.36328125, 24.287109375, 26.2109375, 28.134765625, 30.05859375, 31.982421875, 33.90625, 35.830078125, 37.75390625, 39.677734375, 41.6015625, 43.525390625, 45.44921875, 47.373046875, 49.296875, 51.220703125, 53.14453125, 55.068359375, 56.9921875, 58.916015625, 60.83984375, 62.763671875, 64.6875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 9.0, 9.0, 14.0, 28.0, 42.0, 72.0, 118.0, 232.0, 400.0, 716.0, 1124.0, 1976.0, 3389.0, 5614.0, 9282.0, 14744.0, 22655.0, 33012.0, 47160.0, 62745.0, 79667.0, 93982.0, 104757.0, 106934.0, 102408.0, 91338.0, 76778.0, 59012.0, 44307.0, 30819.0, 20864.0, 13379.0, 8519.0, 5105.0, 3097.0, 1836.0, 1080.0, 566.0, 343.0, 185.0, 89.0, 62.0, 40.0, 27.0, 13.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.34375, -36.9443359375, -35.544921875, -34.1455078125, -32.74609375, -31.3466796875, -29.947265625, -28.5478515625, -27.1484375, -25.7490234375, -24.349609375, -22.9501953125, -21.55078125, -20.1513671875, -18.751953125, -17.3525390625, -15.953125, -14.5537109375, -13.154296875, -11.7548828125, -10.35546875, -8.9560546875, -7.556640625, -6.1572265625, -4.7578125, -3.3583984375, -1.958984375, -0.5595703125, 0.83984375, 2.2392578125, 3.638671875, 5.0380859375, 6.4375, 7.8369140625, 9.236328125, 10.6357421875, 12.03515625, 13.4345703125, 14.833984375, 16.2333984375, 17.6328125, 19.0322265625, 20.431640625, 21.8310546875, 23.23046875, 24.6298828125, 26.029296875, 27.4287109375, 28.828125, 30.2275390625, 31.626953125, 33.0263671875, 34.42578125, 35.8251953125, 37.224609375, 38.6240234375, 40.0234375, 41.4228515625, 42.822265625, 44.2216796875, 45.62109375, 47.0205078125, 48.419921875, 49.8193359375, 51.21875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 3.0, 5.0, 9.0, 8.0, 14.0, 10.0, 17.0, 14.0, 11.0, 23.0, 24.0, 23.0, 24.0, 28.0, 41.0, 33.0, 40.0, 40.0, 33.0, 30.0, 39.0, 31.0, 45.0, 52.0, 33.0, 31.0, 33.0, 26.0, 36.0, 30.0, 23.0, 31.0, 32.0, 17.0, 18.0, 14.0, 13.0, 6.0, 11.0, 11.0, 7.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15625, -37.95361328125, -36.7509765625, -35.54833984375, -34.345703125, -33.14306640625, -31.9404296875, -30.73779296875, -29.53515625, -28.33251953125, -27.1298828125, -25.92724609375, -24.724609375, -23.52197265625, -22.3193359375, -21.11669921875, -19.9140625, -18.71142578125, -17.5087890625, -16.30615234375, -15.103515625, -13.90087890625, -12.6982421875, -11.49560546875, -10.29296875, -9.09033203125, -7.8876953125, -6.68505859375, -5.482421875, -4.27978515625, -3.0771484375, -1.87451171875, -0.671875, 0.53076171875, 1.7333984375, 2.93603515625, 4.138671875, 5.34130859375, 6.5439453125, 7.74658203125, 8.94921875, 10.15185546875, 11.3544921875, 12.55712890625, 13.759765625, 14.96240234375, 16.1650390625, 17.36767578125, 18.5703125, 19.77294921875, 20.9755859375, 22.17822265625, 23.380859375, 24.58349609375, 25.7861328125, 26.98876953125, 28.19140625, 29.39404296875, 30.5966796875, 31.79931640625, 33.001953125, 34.20458984375, 35.4072265625, 36.60986328125, 37.8125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 7.0, 9.0, 15.0, 16.0, 28.0, 40.0, 63.0, 83.0, 112.0, 171.0, 281.0, 409.0, 635.0, 965.0, 1399.0, 2245.0, 3617.0, 5312.0, 8165.0, 12283.0, 17880.0, 26066.0, 36264.0, 49083.0, 62972.0, 77076.0, 89514.0, 97786.0, 99381.0, 95072.0, 85738.0, 72287.0, 57817.0, 44470.0, 32111.0, 22807.0, 15819.0, 10431.0, 6795.0, 4734.0, 2943.0, 1986.0, 1300.0, 824.0, 539.0, 323.0, 233.0, 148.0, 86.0, 76.0, 56.0, 29.0, 27.0, 15.0, 9.0, 8.0, 6.0, 1.0, 2.0, 2.0], "bins": [-15.8359375, -15.345947265625, -14.85595703125, -14.365966796875, -13.8759765625, -13.385986328125, -12.89599609375, -12.406005859375, -11.916015625, -11.426025390625, -10.93603515625, -10.446044921875, -9.9560546875, -9.466064453125, -8.97607421875, -8.486083984375, -7.99609375, -7.506103515625, -7.01611328125, -6.526123046875, -6.0361328125, -5.546142578125, -5.05615234375, -4.566162109375, -4.076171875, -3.586181640625, -3.09619140625, -2.606201171875, -2.1162109375, -1.626220703125, -1.13623046875, -0.646240234375, -0.15625, 0.333740234375, 0.82373046875, 1.313720703125, 1.8037109375, 2.293701171875, 2.78369140625, 3.273681640625, 3.763671875, 4.253662109375, 4.74365234375, 5.233642578125, 5.7236328125, 6.213623046875, 6.70361328125, 7.193603515625, 7.68359375, 8.173583984375, 8.66357421875, 9.153564453125, 9.6435546875, 10.133544921875, 10.62353515625, 11.113525390625, 11.603515625, 12.093505859375, 12.58349609375, 13.073486328125, 13.5634765625, 14.053466796875, 14.54345703125, 15.033447265625, 15.5234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 17.0, 15.0, 18.0, 19.0, 26.0, 39.0, 36.0, 37.0, 51.0, 31.0, 60.0, 44.0, 61.0, 63.0, 59.0, 51.0, 43.0, 43.0, 31.0, 43.0, 34.0, 38.0, 26.0, 23.0, 23.0, 13.0, 8.0, 11.0, 4.0, 3.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002838134765625, -0.0027550160884857178, -0.0026718974113464355, -0.0025887787342071533, -0.002505660057067871, -0.002422541379928589, -0.0023394227027893066, -0.0022563040256500244, -0.002173185348510742, -0.00209006667137146, -0.0020069479942321777, -0.0019238293170928955, -0.0018407106399536133, -0.001757591962814331, -0.0016744732856750488, -0.0015913546085357666, -0.0015082359313964844, -0.0014251172542572021, -0.00134199857711792, -0.0012588798999786377, -0.0011757612228393555, -0.0010926425457000732, -0.001009523868560791, -0.0009264051914215088, -0.0008432865142822266, -0.0007601678371429443, -0.0006770491600036621, -0.0005939304828643799, -0.0005108118057250977, -0.00042769312858581543, -0.0003445744514465332, -0.000261455774307251, -0.00017833709716796875, -9.521842002868652e-05, -1.2099742889404297e-05, 7.101893424987793e-05, 0.00015413761138916016, 0.00023725628852844238, 0.0003203749656677246, 0.00040349364280700684, 0.00048661231994628906, 0.0005697309970855713, 0.0006528496742248535, 0.0007359683513641357, 0.000819087028503418, 0.0009022057056427002, 0.0009853243827819824, 0.0010684430599212646, 0.0011515617370605469, 0.001234680414199829, 0.0013177990913391113, 0.0014009177684783936, 0.0014840364456176758, 0.001567155122756958, 0.0016502737998962402, 0.0017333924770355225, 0.0018165111541748047, 0.001899629831314087, 0.001982748508453369, 0.0020658671855926514, 0.0021489858627319336, 0.002232104539871216, 0.002315223217010498, 0.0023983418941497803, 0.0024814605712890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 17.0, 24.0, 27.0, 30.0, 61.0, 108.0, 164.0, 246.0, 413.0, 645.0, 1092.0, 1808.0, 2903.0, 4750.0, 7764.0, 12540.0, 20049.0, 30420.0, 44945.0, 63377.0, 83710.0, 102572.0, 115229.0, 118124.0, 110168.0, 94337.0, 74417.0, 54443.0, 37555.0, 24931.0, 16044.0, 9984.0, 6040.0, 3722.0, 2251.0, 1362.0, 903.0, 517.0, 304.0, 210.0, 135.0, 68.0, 40.0, 41.0, 23.0, 16.0, 14.0, 3.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.788330078125, -18.12353515625, -17.458740234375, -16.7939453125, -16.129150390625, -15.46435546875, -14.799560546875, -14.134765625, -13.469970703125, -12.80517578125, -12.140380859375, -11.4755859375, -10.810791015625, -10.14599609375, -9.481201171875, -8.81640625, -8.151611328125, -7.48681640625, -6.822021484375, -6.1572265625, -5.492431640625, -4.82763671875, -4.162841796875, -3.498046875, -2.833251953125, -2.16845703125, -1.503662109375, -0.8388671875, -0.174072265625, 0.49072265625, 1.155517578125, 1.8203125, 2.485107421875, 3.14990234375, 3.814697265625, 4.4794921875, 5.144287109375, 5.80908203125, 6.473876953125, 7.138671875, 7.803466796875, 8.46826171875, 9.133056640625, 9.7978515625, 10.462646484375, 11.12744140625, 11.792236328125, 12.45703125, 13.121826171875, 13.78662109375, 14.451416015625, 15.1162109375, 15.781005859375, 16.44580078125, 17.110595703125, 17.775390625, 18.440185546875, 19.10498046875, 19.769775390625, 20.4345703125, 21.099365234375, 21.76416015625, 22.428955078125, 23.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 12.0, 5.0, 14.0, 4.0, 12.0, 12.0, 17.0, 20.0, 21.0, 21.0, 28.0, 17.0, 27.0, 39.0, 48.0, 33.0, 33.0, 33.0, 45.0, 51.0, 48.0, 30.0, 41.0, 34.0, 43.0, 40.0, 25.0, 28.0, 21.0, 21.0, 20.0, 20.0, 14.0, 23.0, 27.0, 9.0, 9.0, 9.0, 9.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.96484375, -7.69805908203125, -7.4312744140625, -7.16448974609375, -6.897705078125, -6.63092041015625, -6.3641357421875, -6.09735107421875, -5.83056640625, -5.56378173828125, -5.2969970703125, -5.03021240234375, -4.763427734375, -4.49664306640625, -4.2298583984375, -3.96307373046875, -3.6962890625, -3.42950439453125, -3.1627197265625, -2.89593505859375, -2.629150390625, -2.36236572265625, -2.0955810546875, -1.82879638671875, -1.56201171875, -1.29522705078125, -1.0284423828125, -0.76165771484375, -0.494873046875, -0.22808837890625, 0.0386962890625, 0.30548095703125, 0.572265625, 0.83905029296875, 1.1058349609375, 1.37261962890625, 1.639404296875, 1.90618896484375, 2.1729736328125, 2.43975830078125, 2.70654296875, 2.97332763671875, 3.2401123046875, 3.50689697265625, 3.773681640625, 4.04046630859375, 4.3072509765625, 4.57403564453125, 4.8408203125, 5.10760498046875, 5.3743896484375, 5.64117431640625, 5.907958984375, 6.17474365234375, 6.4415283203125, 6.70831298828125, 6.97509765625, 7.24188232421875, 7.5086669921875, 7.77545166015625, 8.042236328125, 8.30902099609375, 8.5758056640625, 8.84259033203125, 9.109375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 10.0, 2.0, 10.0, 9.0, 11.0, 8.0, 8.0, 11.0, 16.0, 22.0, 16.0, 13.0, 27.0, 34.0, 32.0, 33.0, 41.0, 40.0, 37.0, 28.0, 31.0, 46.0, 32.0, 44.0, 40.0, 32.0, 29.0, 30.0, 28.0, 26.0, 26.0, 23.0, 28.0, 26.0, 27.0, 18.0, 25.0, 9.0, 9.0, 9.0, 9.0, 8.0, 9.0, 5.0, 6.0, 2.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-56.527687072753906, -54.86153030395508, -53.19537353515625, -51.52921676635742, -49.863059997558594, -48.19690704345703, -46.53074645996094, -44.864593505859375, -43.19843673706055, -41.53227996826172, -39.86612319946289, -38.19996643066406, -36.533809661865234, -34.867652893066406, -33.201499938964844, -31.535343170166016, -29.869184494018555, -28.203027725219727, -26.5368709564209, -24.870716094970703, -23.204559326171875, -21.538402557373047, -19.87224578857422, -18.20608901977539, -16.539932250976562, -14.873775482177734, -13.207619667053223, -11.541462898254395, -9.875307083129883, -8.209150314331055, -6.542993545532227, -4.876837730407715, -3.210681915283203, -1.5445255041122437, 0.12163090705871582, 1.7877874374389648, 3.4539437294006348, 5.120100021362305, 6.786256790161133, 8.452412605285645, 10.118569374084473, 11.7847261428833, 13.450881958007812, 15.11703872680664, 16.78319549560547, 18.449352264404297, 20.115509033203125, 21.78166389465332, 23.44782066345215, 25.113977432250977, 26.780134201049805, 28.4462890625, 30.112445831298828, 31.778602600097656, 33.444759368896484, 35.11091613769531, 36.77707290649414, 38.44322967529297, 40.1093864440918, 41.775543212890625, 43.44169998168945, 45.10785675048828, 46.774009704589844, 48.44016647338867, 50.1063232421875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 15.0, 14.0, 8.0, 20.0, 10.0, 17.0, 20.0, 28.0, 23.0, 25.0, 34.0, 37.0, 38.0, 29.0, 38.0, 52.0, 34.0, 47.0, 45.0, 46.0, 43.0, 40.0, 39.0, 39.0, 30.0, 42.0, 25.0, 26.0, 16.0, 22.0, 20.0, 16.0, 13.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.81147384643555, -55.67109680175781, -53.53071594238281, -51.39033889770508, -49.249961853027344, -47.109580993652344, -44.96920394897461, -42.828826904296875, -40.688446044921875, -38.54806900024414, -36.40768814086914, -34.267311096191406, -32.12693405151367, -29.986555099487305, -27.846176147460938, -25.705799102783203, -23.56542205810547, -21.4250431060791, -19.284666061401367, -17.144287109375, -15.00390911102295, -12.863531112670898, -10.723152160644531, -8.58277416229248, -6.44239616394043, -4.302018165588379, -2.16163969039917, -0.021261215209960938, 2.11911678314209, 4.259494781494141, 6.399873733520508, 8.540251731872559, 10.680633544921875, 12.821011543273926, 14.961389541625977, 17.101768493652344, 19.242145538330078, 21.382524490356445, 23.522903442382812, 25.663280487060547, 27.803659439086914, 29.94403839111328, 32.084415435791016, 34.22479248046875, 36.36517333984375, 38.505550384521484, 40.64592742919922, 42.78630828857422, 44.92668533325195, 47.06706237792969, 49.20744323730469, 51.34782028198242, 53.488197326660156, 55.628578186035156, 57.76895523071289, 59.909332275390625, 62.049713134765625, 64.19009399414062, 66.3304672241211, 68.4708480834961, 70.6112289428711, 72.75160217285156, 74.89198303222656, 77.03236389160156, 79.17273712158203]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 24.0, 28.0, 47.0, 82.0, 129.0, 243.0, 456.0, 780.0, 1201.0, 2057.0, 3362.0, 5304.0, 8751.0, 13824.0, 22019.0, 34292.0, 52399.0, 78231.0, 114713.0, 160931.0, 217855.0, 277919.0, 339984.0, 388691.0, 414729.0, 409730.0, 381396.0, 329633.0, 267333.0, 206089.0, 149846.0, 106846.0, 72593.0, 47944.0, 31307.0, 20228.0, 12459.0, 7981.0, 4838.0, 3064.0, 1999.0, 1133.0, 712.0, 421.0, 230.0, 164.0, 113.0, 71.0, 43.0, 27.0, 10.0, 11.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-41.8125, -40.45947265625, -39.1064453125, -37.75341796875, -36.400390625, -35.04736328125, -33.6943359375, -32.34130859375, -30.98828125, -29.63525390625, -28.2822265625, -26.92919921875, -25.576171875, -24.22314453125, -22.8701171875, -21.51708984375, -20.1640625, -18.81103515625, -17.4580078125, -16.10498046875, -14.751953125, -13.39892578125, -12.0458984375, -10.69287109375, -9.33984375, -7.98681640625, -6.6337890625, -5.28076171875, -3.927734375, -2.57470703125, -1.2216796875, 0.13134765625, 1.484375, 2.83740234375, 4.1904296875, 5.54345703125, 6.896484375, 8.24951171875, 9.6025390625, 10.95556640625, 12.30859375, 13.66162109375, 15.0146484375, 16.36767578125, 17.720703125, 19.07373046875, 20.4267578125, 21.77978515625, 23.1328125, 24.48583984375, 25.8388671875, 27.19189453125, 28.544921875, 29.89794921875, 31.2509765625, 32.60400390625, 33.95703125, 35.31005859375, 36.6630859375, 38.01611328125, 39.369140625, 40.72216796875, 42.0751953125, 43.42822265625, 44.78125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 16.0, 11.0, 8.0, 15.0, 16.0, 19.0, 18.0, 30.0, 19.0, 21.0, 37.0, 42.0, 26.0, 37.0, 37.0, 44.0, 39.0, 42.0, 52.0, 41.0, 39.0, 42.0, 38.0, 40.0, 37.0, 36.0, 29.0, 20.0, 22.0, 19.0, 18.0, 20.0, 15.0, 9.0, 10.0, 7.0, 4.0, 5.0, 4.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.03125, -49.15478515625, -47.2783203125, -45.40185546875, -43.525390625, -41.64892578125, -39.7724609375, -37.89599609375, -36.01953125, -34.14306640625, -32.2666015625, -30.39013671875, -28.513671875, -26.63720703125, -24.7607421875, -22.88427734375, -21.0078125, -19.13134765625, -17.2548828125, -15.37841796875, -13.501953125, -11.62548828125, -9.7490234375, -7.87255859375, -5.99609375, -4.11962890625, -2.2431640625, -0.36669921875, 1.509765625, 3.38623046875, 5.2626953125, 7.13916015625, 9.015625, 10.89208984375, 12.7685546875, 14.64501953125, 16.521484375, 18.39794921875, 20.2744140625, 22.15087890625, 24.02734375, 25.90380859375, 27.7802734375, 29.65673828125, 31.533203125, 33.40966796875, 35.2861328125, 37.16259765625, 39.0390625, 40.91552734375, 42.7919921875, 44.66845703125, 46.544921875, 48.42138671875, 50.2978515625, 52.17431640625, 54.05078125, 55.92724609375, 57.8037109375, 59.68017578125, 61.556640625, 63.43310546875, 65.3095703125, 67.18603515625, 69.0625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 15.0, 27.0, 46.0, 93.0, 190.0, 295.0, 500.0, 884.0, 1591.0, 2477.0, 4332.0, 7086.0, 11487.0, 18468.0, 29606.0, 45764.0, 68623.0, 101308.0, 140926.0, 191202.0, 248418.0, 304618.0, 354182.0, 387647.0, 398152.0, 384156.0, 348207.0, 299060.0, 242316.0, 185788.0, 137275.0, 95939.0, 66231.0, 44127.0, 28019.0, 17582.0, 11051.0, 6751.0, 4085.0, 2358.0, 1403.0, 824.0, 485.0, 284.0, 170.0, 92.0, 71.0, 35.0, 16.0, 12.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-46.46875, -45.03662109375, -43.6044921875, -42.17236328125, -40.740234375, -39.30810546875, -37.8759765625, -36.44384765625, -35.01171875, -33.57958984375, -32.1474609375, -30.71533203125, -29.283203125, -27.85107421875, -26.4189453125, -24.98681640625, -23.5546875, -22.12255859375, -20.6904296875, -19.25830078125, -17.826171875, -16.39404296875, -14.9619140625, -13.52978515625, -12.09765625, -10.66552734375, -9.2333984375, -7.80126953125, -6.369140625, -4.93701171875, -3.5048828125, -2.07275390625, -0.640625, 0.79150390625, 2.2236328125, 3.65576171875, 5.087890625, 6.52001953125, 7.9521484375, 9.38427734375, 10.81640625, 12.24853515625, 13.6806640625, 15.11279296875, 16.544921875, 17.97705078125, 19.4091796875, 20.84130859375, 22.2734375, 23.70556640625, 25.1376953125, 26.56982421875, 28.001953125, 29.43408203125, 30.8662109375, 32.29833984375, 33.73046875, 35.16259765625, 36.5947265625, 38.02685546875, 39.458984375, 40.89111328125, 42.3232421875, 43.75537109375, 45.1875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 11.0, 8.0, 9.0, 7.0, 16.0, 22.0, 24.0, 35.0, 53.0, 60.0, 64.0, 81.0, 86.0, 108.0, 107.0, 138.0, 113.0, 156.0, 155.0, 188.0, 223.0, 166.0, 198.0, 195.0, 191.0, 196.0, 157.0, 168.0, 149.0, 156.0, 117.0, 102.0, 92.0, 82.0, 79.0, 71.0, 48.0, 54.0, 44.0, 29.0, 23.0, 31.0, 10.0, 19.0, 14.0, 4.0, 3.0, 5.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0], "bins": [-25.15625, -24.398681640625, -23.64111328125, -22.883544921875, -22.1259765625, -21.368408203125, -20.61083984375, -19.853271484375, -19.095703125, -18.338134765625, -17.58056640625, -16.822998046875, -16.0654296875, -15.307861328125, -14.55029296875, -13.792724609375, -13.03515625, -12.277587890625, -11.52001953125, -10.762451171875, -10.0048828125, -9.247314453125, -8.48974609375, -7.732177734375, -6.974609375, -6.217041015625, -5.45947265625, -4.701904296875, -3.9443359375, -3.186767578125, -2.42919921875, -1.671630859375, -0.9140625, -0.156494140625, 0.60107421875, 1.358642578125, 2.1162109375, 2.873779296875, 3.63134765625, 4.388916015625, 5.146484375, 5.904052734375, 6.66162109375, 7.419189453125, 8.1767578125, 8.934326171875, 9.69189453125, 10.449462890625, 11.20703125, 11.964599609375, 12.72216796875, 13.479736328125, 14.2373046875, 14.994873046875, 15.75244140625, 16.510009765625, 17.267578125, 18.025146484375, 18.78271484375, 19.540283203125, 20.2978515625, 21.055419921875, 21.81298828125, 22.570556640625, 23.328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 10.0, 6.0, 11.0, 15.0, 12.0, 9.0, 16.0, 20.0, 22.0, 26.0, 24.0, 27.0, 36.0, 39.0, 28.0, 38.0, 37.0, 42.0, 45.0, 50.0, 44.0, 43.0, 35.0, 38.0, 26.0, 37.0, 27.0, 26.0, 26.0, 24.0, 27.0, 12.0, 24.0, 12.0, 16.0, 9.0, 11.0, 3.0, 8.0, 8.0, 7.0, 7.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.483909606933594, -53.61665725708008, -51.74940872192383, -49.88215637207031, -48.01490783691406, -46.14765548706055, -44.28040313720703, -42.41315460205078, -40.545902252197266, -38.67864990234375, -36.8114013671875, -34.944149017333984, -33.076900482177734, -31.20964813232422, -29.342397689819336, -27.475147247314453, -25.60789680480957, -23.740646362304688, -21.873395919799805, -20.006145477294922, -18.138893127441406, -16.271642684936523, -14.40439224243164, -12.537140846252441, -10.669890403747559, -8.802639961242676, -6.935388565063477, -5.068138122558594, -3.2008872032165527, -1.3336362838745117, 0.5336141586303711, 2.4008655548095703, 4.268115997314453, 6.135366916656494, 8.002617835998535, 9.869868278503418, 11.737119674682617, 13.6043701171875, 15.471620559692383, 17.338871002197266, 19.20612335205078, 21.073373794555664, 22.940624237060547, 24.807876586914062, 26.675127029418945, 28.542377471923828, 30.40962791442871, 32.276878356933594, 34.144126892089844, 36.01137924194336, 37.87862777709961, 39.745880126953125, 41.613128662109375, 43.48038101196289, 45.347633361816406, 47.214881896972656, 49.08213424682617, 50.94938659667969, 52.81663513183594, 54.68388748168945, 56.5511360168457, 58.41838836669922, 60.28563690185547, 62.152889251708984, 64.0201416015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [6.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 1.0, 9.0, 7.0, 11.0, 12.0, 11.0, 22.0, 25.0, 15.0, 27.0, 26.0, 21.0, 17.0, 24.0, 30.0, 36.0, 26.0, 37.0, 40.0, 31.0, 29.0, 40.0, 40.0, 31.0, 38.0, 45.0, 33.0, 36.0, 31.0, 29.0, 32.0, 20.0, 25.0, 19.0, 16.0, 15.0, 17.0, 12.0, 6.0, 7.0, 10.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-50.905338287353516, -49.10744857788086, -47.30955505371094, -45.51166534423828, -43.71377182006836, -41.9158821105957, -40.11798858642578, -38.320098876953125, -36.52220916748047, -34.72431945800781, -32.92642593383789, -31.128536224365234, -29.330642700195312, -27.532752990722656, -25.734861373901367, -23.936969757080078, -22.139076232910156, -20.341184616088867, -18.543292999267578, -16.745403289794922, -14.947510719299316, -13.149619102478027, -11.351728439331055, -9.553836822509766, -7.755945205688477, -5.9580535888671875, -4.160162448883057, -2.362271308898926, -0.5643796920776367, 1.2335119247436523, 3.031402587890625, 4.829294204711914, 6.627189636230469, 8.425081253051758, 10.222972869873047, 12.02086353302002, 13.818755149841309, 15.616646766662598, 17.41453742980957, 19.21242904663086, 21.01032066345215, 22.808212280273438, 24.606103897094727, 26.403995513916016, 28.201885223388672, 29.999778747558594, 31.79766845703125, 33.595558166503906, 35.39345169067383, 37.191341400146484, 38.989234924316406, 40.78712463378906, 42.585018157958984, 44.38290786743164, 46.18080139160156, 47.97869110107422, 49.776580810546875, 51.57447052001953, 53.37236404418945, 55.17025375366211, 56.96814727783203, 58.76603698730469, 60.563926696777344, 62.361820220947266, 64.15971374511719]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 10.0, 14.0, 19.0, 30.0, 41.0, 67.0, 99.0, 157.0, 214.0, 303.0, 477.0, 690.0, 1068.0, 1575.0, 2380.0, 3621.0, 5432.0, 7967.0, 11607.0, 17099.0, 24088.0, 34120.0, 46662.0, 59974.0, 75804.0, 90004.0, 99220.0, 102146.0, 97896.0, 87647.0, 72903.0, 57617.0, 43967.0, 31704.0, 22688.0, 15950.0, 10989.0, 7450.0, 4882.0, 3232.0, 2244.0, 1514.0, 974.0, 692.0, 415.0, 293.0, 213.0, 142.0, 65.0, 74.0, 33.0, 33.0, 15.0, 13.0, 10.0, 7.0, 4.0, 5.0, 0.0, 3.0, 3.0], "bins": [-9.015625, -8.7191162109375, -8.422607421875, -8.1260986328125, -7.82958984375, -7.5330810546875, -7.236572265625, -6.9400634765625, -6.6435546875, -6.3470458984375, -6.050537109375, -5.7540283203125, -5.45751953125, -5.1610107421875, -4.864501953125, -4.5679931640625, -4.271484375, -3.9749755859375, -3.678466796875, -3.3819580078125, -3.08544921875, -2.7889404296875, -2.492431640625, -2.1959228515625, -1.8994140625, -1.6029052734375, -1.306396484375, -1.0098876953125, -0.71337890625, -0.4168701171875, -0.120361328125, 0.1761474609375, 0.47265625, 0.7691650390625, 1.065673828125, 1.3621826171875, 1.65869140625, 1.9552001953125, 2.251708984375, 2.5482177734375, 2.8447265625, 3.1412353515625, 3.437744140625, 3.7342529296875, 4.03076171875, 4.3272705078125, 4.623779296875, 4.9202880859375, 5.216796875, 5.5133056640625, 5.809814453125, 6.1063232421875, 6.40283203125, 6.6993408203125, 6.995849609375, 7.2923583984375, 7.5888671875, 7.8853759765625, 8.181884765625, 8.4783935546875, 8.77490234375, 9.0714111328125, 9.367919921875, 9.6644287109375, 9.9609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 0.0, 9.0, 7.0, 12.0, 11.0, 13.0, 22.0, 24.0, 15.0, 28.0, 25.0, 20.0, 17.0, 25.0, 33.0, 33.0, 31.0, 32.0, 40.0, 31.0, 32.0, 42.0, 34.0, 31.0, 43.0, 42.0, 34.0, 33.0, 31.0, 29.0, 32.0, 23.0, 23.0, 19.0, 16.0, 19.0, 13.0, 12.0, 5.0, 9.0, 9.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.125, -49.3232421875, -47.521484375, -45.7197265625, -43.91796875, -42.1162109375, -40.314453125, -38.5126953125, -36.7109375, -34.9091796875, -33.107421875, -31.3056640625, -29.50390625, -27.7021484375, -25.900390625, -24.0986328125, -22.296875, -20.4951171875, -18.693359375, -16.8916015625, -15.08984375, -13.2880859375, -11.486328125, -9.6845703125, -7.8828125, -6.0810546875, -4.279296875, -2.4775390625, -0.67578125, 1.1259765625, 2.927734375, 4.7294921875, 6.53125, 8.3330078125, 10.134765625, 11.9365234375, 13.73828125, 15.5400390625, 17.341796875, 19.1435546875, 20.9453125, 22.7470703125, 24.548828125, 26.3505859375, 28.15234375, 29.9541015625, 31.755859375, 33.5576171875, 35.359375, 37.1611328125, 38.962890625, 40.7646484375, 42.56640625, 44.3681640625, 46.169921875, 47.9716796875, 49.7734375, 51.5751953125, 53.376953125, 55.1787109375, 56.98046875, 58.7822265625, 60.583984375, 62.3857421875, 64.1875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 8.0, 5.0, 6.0, 8.0, 26.0, 22.0, 31.0, 72.0, 82.0, 149.0, 260.0, 422.0, 788.0, 1370.0, 2519.0, 4758.0, 8775.0, 17684.0, 38253.0, 832646.0, 89846.0, 24415.0, 12210.0, 6457.0, 3443.0, 1853.0, 1018.0, 597.0, 319.0, 189.0, 110.0, 85.0, 41.0, 32.0, 20.0, 9.0, 12.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.5, -41.07080078125, -39.6416015625, -38.21240234375, -36.783203125, -35.35400390625, -33.9248046875, -32.49560546875, -31.06640625, -29.63720703125, -28.2080078125, -26.77880859375, -25.349609375, -23.92041015625, -22.4912109375, -21.06201171875, -19.6328125, -18.20361328125, -16.7744140625, -15.34521484375, -13.916015625, -12.48681640625, -11.0576171875, -9.62841796875, -8.19921875, -6.77001953125, -5.3408203125, -3.91162109375, -2.482421875, -1.05322265625, 0.3759765625, 1.80517578125, 3.234375, 4.66357421875, 6.0927734375, 7.52197265625, 8.951171875, 10.38037109375, 11.8095703125, 13.23876953125, 14.66796875, 16.09716796875, 17.5263671875, 18.95556640625, 20.384765625, 21.81396484375, 23.2431640625, 24.67236328125, 26.1015625, 27.53076171875, 28.9599609375, 30.38916015625, 31.818359375, 33.24755859375, 34.6767578125, 36.10595703125, 37.53515625, 38.96435546875, 40.3935546875, 41.82275390625, 43.251953125, 44.68115234375, 46.1103515625, 47.53955078125, 48.96875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 11.0, 12.0, 9.0, 16.0, 14.0, 21.0, 28.0, 16.0, 19.0, 29.0, 35.0, 36.0, 40.0, 46.0, 36.0, 59.0, 46.0, 43.0, 31.0, 48.0, 47.0, 27.0, 26.0, 35.0, 38.0, 35.0, 23.0, 17.0, 19.0, 17.0, 13.0, 16.0, 13.0, 19.0, 10.0, 8.0, 9.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-44.75, -43.41455078125, -42.0791015625, -40.74365234375, -39.408203125, -38.07275390625, -36.7373046875, -35.40185546875, -34.06640625, -32.73095703125, -31.3955078125, -30.06005859375, -28.724609375, -27.38916015625, -26.0537109375, -24.71826171875, -23.3828125, -22.04736328125, -20.7119140625, -19.37646484375, -18.041015625, -16.70556640625, -15.3701171875, -14.03466796875, -12.69921875, -11.36376953125, -10.0283203125, -8.69287109375, -7.357421875, -6.02197265625, -4.6865234375, -3.35107421875, -2.015625, -0.68017578125, 0.6552734375, 1.99072265625, 3.326171875, 4.66162109375, 5.9970703125, 7.33251953125, 8.66796875, 10.00341796875, 11.3388671875, 12.67431640625, 14.009765625, 15.34521484375, 16.6806640625, 18.01611328125, 19.3515625, 20.68701171875, 22.0224609375, 23.35791015625, 24.693359375, 26.02880859375, 27.3642578125, 28.69970703125, 30.03515625, 31.37060546875, 32.7060546875, 34.04150390625, 35.376953125, 36.71240234375, 38.0478515625, 39.38330078125, 40.71875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 9.0, 8.0, 6.0, 10.0, 22.0, 17.0, 21.0, 37.0, 34.0, 41.0, 75.0, 93.0, 152.0, 218.0, 370.0, 568.0, 1047.0, 1792.0, 3351.0, 6776.0, 13705.0, 29719.0, 336975.0, 590908.0, 32016.0, 14821.0, 7268.0, 3591.0, 1941.0, 1134.0, 636.0, 348.0, 240.0, 189.0, 110.0, 78.0, 57.0, 37.0, 27.0, 21.0, 19.0, 17.0, 11.0, 13.0, 11.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.50390625, -3.39105224609375, -3.2781982421875, -3.16534423828125, -3.052490234375, -2.93963623046875, -2.8267822265625, -2.71392822265625, -2.60107421875, -2.48822021484375, -2.3753662109375, -2.26251220703125, -2.149658203125, -2.03680419921875, -1.9239501953125, -1.81109619140625, -1.6982421875, -1.58538818359375, -1.4725341796875, -1.35968017578125, -1.246826171875, -1.13397216796875, -1.0211181640625, -0.90826416015625, -0.79541015625, -0.68255615234375, -0.5697021484375, -0.45684814453125, -0.343994140625, -0.23114013671875, -0.1182861328125, -0.00543212890625, 0.107421875, 0.22027587890625, 0.3331298828125, 0.44598388671875, 0.558837890625, 0.67169189453125, 0.7845458984375, 0.89739990234375, 1.01025390625, 1.12310791015625, 1.2359619140625, 1.34881591796875, 1.461669921875, 1.57452392578125, 1.6873779296875, 1.80023193359375, 1.9130859375, 2.02593994140625, 2.1387939453125, 2.25164794921875, 2.364501953125, 2.47735595703125, 2.5902099609375, 2.70306396484375, 2.81591796875, 2.92877197265625, 3.0416259765625, 3.15447998046875, 3.267333984375, 3.38018798828125, 3.4930419921875, 3.60589599609375, 3.71875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 11.0, 7.0, 13.0, 12.0, 20.0, 26.0, 24.0, 28.0, 33.0, 48.0, 40.0, 50.0, 49.0, 61.0, 56.0, 64.0, 53.0, 52.0, 65.0, 41.0, 42.0, 29.0, 30.0, 20.0, 31.0, 23.0, 16.0, 6.0, 9.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.372550994157791e-05, -9.011663496494293e-05, -8.650775998830795e-05, -8.289888501167297e-05, -7.9290010035038e-05, -7.568113505840302e-05, -7.207226008176804e-05, -6.846338510513306e-05, -6.485451012849808e-05, -6.12456351518631e-05, -5.763676017522812e-05, -5.402788519859314e-05, -5.041901022195816e-05, -4.681013524532318e-05, -4.32012602686882e-05, -3.959238529205322e-05, -3.5983510315418243e-05, -3.2374635338783264e-05, -2.8765760362148285e-05, -2.5156885385513306e-05, -2.1548010408878326e-05, -1.7939135432243347e-05, -1.4330260455608368e-05, -1.0721385478973389e-05, -7.1125105023384094e-06, -3.50363552570343e-06, 1.0523945093154907e-07, 3.7141144275665283e-06, 7.3229894042015076e-06, 1.0931864380836487e-05, 1.4540739357471466e-05, 1.8149614334106445e-05, 2.1758489310741425e-05, 2.5367364287376404e-05, 2.8976239264011383e-05, 3.258511424064636e-05, 3.619398921728134e-05, 3.980286419391632e-05, 4.34117391705513e-05, 4.702061414718628e-05, 5.062948912382126e-05, 5.423836410045624e-05, 5.784723907709122e-05, 6.14561140537262e-05, 6.506498903036118e-05, 6.867386400699615e-05, 7.228273898363113e-05, 7.589161396026611e-05, 7.950048893690109e-05, 8.310936391353607e-05, 8.671823889017105e-05, 9.032711386680603e-05, 9.393598884344101e-05, 9.754486382007599e-05, 0.00010115373879671097, 0.00010476261377334595, 0.00010837148874998093, 0.0001119803637266159, 0.00011558923870325089, 0.00011919811367988586, 0.00012280698865652084, 0.00012641586363315582, 0.0001300247386097908, 0.00013363361358642578]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 9.0, 8.0, 23.0, 26.0, 45.0, 84.0, 112.0, 188.0, 271.0, 469.0, 770.0, 1248.0, 2037.0, 3429.0, 5589.0, 9637.0, 15776.0, 26149.0, 42204.0, 65599.0, 96704.0, 132374.0, 155431.0, 147817.0, 117184.0, 83415.0, 54491.0, 34401.0, 21200.0, 12784.0, 7580.0, 4629.0, 2674.0, 1599.0, 955.0, 615.0, 400.0, 229.0, 120.0, 95.0, 68.0, 47.0, 26.0, 11.0, 12.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.900390625, -2.80914306640625, -2.7178955078125, -2.62664794921875, -2.535400390625, -2.44415283203125, -2.3529052734375, -2.26165771484375, -2.17041015625, -2.07916259765625, -1.9879150390625, -1.89666748046875, -1.805419921875, -1.71417236328125, -1.6229248046875, -1.53167724609375, -1.4404296875, -1.34918212890625, -1.2579345703125, -1.16668701171875, -1.075439453125, -0.98419189453125, -0.8929443359375, -0.80169677734375, -0.71044921875, -0.61920166015625, -0.5279541015625, -0.43670654296875, -0.345458984375, -0.25421142578125, -0.1629638671875, -0.07171630859375, 0.01953125, 0.11077880859375, 0.2020263671875, 0.29327392578125, 0.384521484375, 0.47576904296875, 0.5670166015625, 0.65826416015625, 0.74951171875, 0.84075927734375, 0.9320068359375, 1.02325439453125, 1.114501953125, 1.20574951171875, 1.2969970703125, 1.38824462890625, 1.4794921875, 1.57073974609375, 1.6619873046875, 1.75323486328125, 1.844482421875, 1.93572998046875, 2.0269775390625, 2.11822509765625, 2.20947265625, 2.30072021484375, 2.3919677734375, 2.48321533203125, 2.574462890625, 2.66571044921875, 2.7569580078125, 2.84820556640625, 2.939453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 7.0, 20.0, 10.0, 22.0, 23.0, 21.0, 25.0, 28.0, 31.0, 28.0, 34.0, 36.0, 31.0, 38.0, 33.0, 32.0, 63.0, 50.0, 51.0, 42.0, 49.0, 31.0, 33.0, 41.0, 24.0, 28.0, 34.0, 21.0, 23.0, 17.0, 19.0, 11.0, 9.0, 7.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2119140625, -1.1786270141601562, -1.1453399658203125, -1.1120529174804688, -1.078765869140625, -1.0454788208007812, -1.0121917724609375, -0.9789047241210938, -0.94561767578125, -0.9123306274414062, -0.8790435791015625, -0.8457565307617188, -0.812469482421875, -0.7791824340820312, -0.7458953857421875, -0.7126083374023438, -0.6793212890625, -0.6460342407226562, -0.6127471923828125, -0.5794601440429688, -0.546173095703125, -0.5128860473632812, -0.4795989990234375, -0.44631195068359375, -0.41302490234375, -0.37973785400390625, -0.3464508056640625, -0.31316375732421875, -0.279876708984375, -0.24658966064453125, -0.2133026123046875, -0.18001556396484375, -0.146728515625, -0.11344146728515625, -0.0801544189453125, -0.04686737060546875, -0.013580322265625, 0.01970672607421875, 0.0529937744140625, 0.08628082275390625, 0.11956787109375, 0.15285491943359375, 0.1861419677734375, 0.21942901611328125, 0.252716064453125, 0.28600311279296875, 0.3192901611328125, 0.35257720947265625, 0.3858642578125, 0.41915130615234375, 0.4524383544921875, 0.48572540283203125, 0.519012451171875, 0.5522994995117188, 0.5855865478515625, 0.6188735961914062, 0.65216064453125, 0.6854476928710938, 0.7187347412109375, 0.7520217895507812, 0.785308837890625, 0.8185958862304688, 0.8518829345703125, 0.8851699829101562, 0.91845703125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 6.0, 5.0, 7.0, 5.0, 6.0, 15.0, 12.0, 13.0, 9.0, 19.0, 16.0, 30.0, 23.0, 17.0, 34.0, 40.0, 31.0, 35.0, 37.0, 44.0, 44.0, 45.0, 43.0, 43.0, 34.0, 36.0, 37.0, 36.0, 30.0, 30.0, 32.0, 18.0, 26.0, 23.0, 13.0, 21.0, 19.0, 10.0, 8.0, 7.0, 10.0, 6.0, 9.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.912818908691406, -53.04204177856445, -51.1712646484375, -49.30048751831055, -47.429710388183594, -45.55893325805664, -43.68815612792969, -41.8173828125, -39.94660186767578, -38.07582473754883, -36.205047607421875, -34.33427047729492, -32.46349334716797, -30.592716217041016, -28.721940994262695, -26.851163864135742, -24.980388641357422, -23.10961151123047, -21.238834381103516, -19.368057250976562, -17.49728012084961, -15.626503944396973, -13.755727767944336, -11.884950637817383, -10.01417350769043, -8.143396377563477, -6.272619724273682, -4.401843070983887, -2.5310659408569336, -0.6602888107299805, 1.2104873657226562, 3.0812644958496094, 4.9520416259765625, 6.822818756103516, 8.693595886230469, 10.564372062683105, 12.435149192810059, 14.305926322937012, 16.17670249938965, 18.0474796295166, 19.918256759643555, 21.789033889770508, 23.65981101989746, 25.53058624267578, 27.401363372802734, 29.272140502929688, 31.14291763305664, 33.013694763183594, 34.88447189331055, 36.7552490234375, 38.62602615356445, 40.496803283691406, 42.36758041381836, 44.23835754394531, 46.109130859375, 47.97991180419922, 49.850685119628906, 51.72146224975586, 53.59223937988281, 55.463016510009766, 57.33379364013672, 59.20457077026367, 61.075347900390625, 62.94612121582031, 64.81690216064453]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 12.0, 9.0, 16.0, 24.0, 20.0, 20.0, 25.0, 23.0, 22.0, 24.0, 23.0, 33.0, 31.0, 35.0, 36.0, 37.0, 24.0, 37.0, 41.0, 35.0, 34.0, 34.0, 47.0, 34.0, 31.0, 33.0, 30.0, 30.0, 21.0, 22.0, 21.0, 15.0, 17.0, 18.0, 7.0, 3.0, 12.0, 9.0, 10.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.96181106567383, -49.15064239501953, -47.33946990966797, -45.52830123901367, -43.717132568359375, -41.90596008300781, -40.094791412353516, -38.28362274169922, -36.472450256347656, -34.66128158569336, -32.8501091003418, -31.0389404296875, -29.22776985168457, -27.41659927368164, -25.605430603027344, -23.794260025024414, -21.983089447021484, -20.171918869018555, -18.360748291015625, -16.549579620361328, -14.738409042358398, -12.927238464355469, -11.116068840026855, -9.304899215698242, -7.4937286376953125, -5.682558536529541, -3.8713884353637695, -2.060218334197998, -0.24904823303222656, 1.5621223449707031, 3.3732919692993164, 5.18446159362793, 6.995635986328125, 8.806806564331055, 10.617976188659668, 12.429145812988281, 14.240316390991211, 16.05148696899414, 17.862655639648438, 19.673826217651367, 21.484996795654297, 23.296167373657227, 25.107337951660156, 26.918506622314453, 28.729677200317383, 30.540847778320312, 32.35201644897461, 34.163185119628906, 35.97435760498047, 37.785526275634766, 39.59669876098633, 41.407867431640625, 43.21903991699219, 45.030208587646484, 46.84137725830078, 48.652549743652344, 50.46371841430664, 52.27488708496094, 54.0860595703125, 55.8972282409668, 57.708396911621094, 59.519569396972656, 61.33073806762695, 63.14190673828125, 64.95307922363281]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 12.0, 25.0, 40.0, 71.0, 89.0, 168.0, 263.0, 448.0, 739.0, 1193.0, 1930.0, 3152.0, 4795.0, 7269.0, 10550.0, 15717.0, 22293.0, 30518.0, 40658.0, 52069.0, 63835.0, 75542.0, 83509.0, 89533.0, 90778.0, 86503.0, 79057.0, 68847.0, 57659.0, 45140.0, 35299.0, 25929.0, 18239.0, 12830.0, 8514.0, 5449.0, 3705.0, 2335.0, 1444.0, 958.0, 547.0, 369.0, 197.0, 126.0, 94.0, 55.0, 23.0, 13.0, 12.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-37.25, -36.09375, -34.9375, -33.78125, -32.625, -31.46875, -30.3125, -29.15625, -28.0, -26.84375, -25.6875, -24.53125, -23.375, -22.21875, -21.0625, -19.90625, -18.75, -17.59375, -16.4375, -15.28125, -14.125, -12.96875, -11.8125, -10.65625, -9.5, -8.34375, -7.1875, -6.03125, -4.875, -3.71875, -2.5625, -1.40625, -0.25, 0.90625, 2.0625, 3.21875, 4.375, 5.53125, 6.6875, 7.84375, 9.0, 10.15625, 11.3125, 12.46875, 13.625, 14.78125, 15.9375, 17.09375, 18.25, 19.40625, 20.5625, 21.71875, 22.875, 24.03125, 25.1875, 26.34375, 27.5, 28.65625, 29.8125, 30.96875, 32.125, 33.28125, 34.4375, 35.59375, 36.75]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 7.0, 9.0, 9.0, 12.0, 11.0, 25.0, 22.0, 17.0, 28.0, 21.0, 24.0, 22.0, 26.0, 33.0, 28.0, 30.0, 39.0, 37.0, 30.0, 28.0, 42.0, 36.0, 30.0, 41.0, 43.0, 37.0, 30.0, 34.0, 34.0, 25.0, 24.0, 20.0, 22.0, 17.0, 17.0, 17.0, 8.0, 5.0, 11.0, 6.0, 8.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-49.65625, -47.90234375, -46.1484375, -44.39453125, -42.640625, -40.88671875, -39.1328125, -37.37890625, -35.625, -33.87109375, -32.1171875, -30.36328125, -28.609375, -26.85546875, -25.1015625, -23.34765625, -21.59375, -19.83984375, -18.0859375, -16.33203125, -14.578125, -12.82421875, -11.0703125, -9.31640625, -7.5625, -5.80859375, -4.0546875, -2.30078125, -0.546875, 1.20703125, 2.9609375, 4.71484375, 6.46875, 8.22265625, 9.9765625, 11.73046875, 13.484375, 15.23828125, 16.9921875, 18.74609375, 20.5, 22.25390625, 24.0078125, 25.76171875, 27.515625, 29.26953125, 31.0234375, 32.77734375, 34.53125, 36.28515625, 38.0390625, 39.79296875, 41.546875, 43.30078125, 45.0546875, 46.80859375, 48.5625, 50.31640625, 52.0703125, 53.82421875, 55.578125, 57.33203125, 59.0859375, 60.83984375, 62.59375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 8.0, 9.0, 23.0, 32.0, 43.0, 72.0, 117.0, 166.0, 246.0, 432.0, 628.0, 1004.0, 1526.0, 2285.0, 3433.0, 4993.0, 7187.0, 10428.0, 14558.0, 20210.0, 26655.0, 34445.0, 44101.0, 53701.0, 63620.0, 72353.0, 78222.0, 81872.0, 82336.0, 78863.0, 72505.0, 64138.0, 54054.0, 44333.0, 34699.0, 27237.0, 20022.0, 14824.0, 10568.0, 7432.0, 5169.0, 3269.0, 2332.0, 1549.0, 1013.0, 649.0, 422.0, 287.0, 181.0, 121.0, 68.0, 51.0, 24.0, 27.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-31.125, -30.12158203125, -29.1181640625, -28.11474609375, -27.111328125, -26.10791015625, -25.1044921875, -24.10107421875, -23.09765625, -22.09423828125, -21.0908203125, -20.08740234375, -19.083984375, -18.08056640625, -17.0771484375, -16.07373046875, -15.0703125, -14.06689453125, -13.0634765625, -12.06005859375, -11.056640625, -10.05322265625, -9.0498046875, -8.04638671875, -7.04296875, -6.03955078125, -5.0361328125, -4.03271484375, -3.029296875, -2.02587890625, -1.0224609375, -0.01904296875, 0.984375, 1.98779296875, 2.9912109375, 3.99462890625, 4.998046875, 6.00146484375, 7.0048828125, 8.00830078125, 9.01171875, 10.01513671875, 11.0185546875, 12.02197265625, 13.025390625, 14.02880859375, 15.0322265625, 16.03564453125, 17.0390625, 18.04248046875, 19.0458984375, 20.04931640625, 21.052734375, 22.05615234375, 23.0595703125, 24.06298828125, 25.06640625, 26.06982421875, 27.0732421875, 28.07666015625, 29.080078125, 30.08349609375, 31.0869140625, 32.09033203125, 33.09375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 9.0, 8.0, 6.0, 9.0, 3.0, 12.0, 12.0, 10.0, 15.0, 18.0, 24.0, 31.0, 36.0, 22.0, 36.0, 25.0, 46.0, 36.0, 24.0, 31.0, 49.0, 41.0, 45.0, 46.0, 35.0, 35.0, 42.0, 37.0, 35.0, 32.0, 41.0, 22.0, 18.0, 14.0, 13.0, 18.0, 16.0, 9.0, 6.0, 8.0, 6.0, 9.0, 7.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.5625, -39.32861328125, -38.0947265625, -36.86083984375, -35.626953125, -34.39306640625, -33.1591796875, -31.92529296875, -30.69140625, -29.45751953125, -28.2236328125, -26.98974609375, -25.755859375, -24.52197265625, -23.2880859375, -22.05419921875, -20.8203125, -19.58642578125, -18.3525390625, -17.11865234375, -15.884765625, -14.65087890625, -13.4169921875, -12.18310546875, -10.94921875, -9.71533203125, -8.4814453125, -7.24755859375, -6.013671875, -4.77978515625, -3.5458984375, -2.31201171875, -1.078125, 0.15576171875, 1.3896484375, 2.62353515625, 3.857421875, 5.09130859375, 6.3251953125, 7.55908203125, 8.79296875, 10.02685546875, 11.2607421875, 12.49462890625, 13.728515625, 14.96240234375, 16.1962890625, 17.43017578125, 18.6640625, 19.89794921875, 21.1318359375, 22.36572265625, 23.599609375, 24.83349609375, 26.0673828125, 27.30126953125, 28.53515625, 29.76904296875, 31.0029296875, 32.23681640625, 33.470703125, 34.70458984375, 35.9384765625, 37.17236328125, 38.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 12.0, 22.0, 21.0, 44.0, 89.0, 129.0, 197.0, 319.0, 462.0, 800.0, 1206.0, 1957.0, 2969.0, 4681.0, 7477.0, 11325.0, 16883.0, 25114.0, 35107.0, 47775.0, 62118.0, 76535.0, 88967.0, 97963.0, 100552.0, 96898.0, 87565.0, 74443.0, 59414.0, 45460.0, 33374.0, 23403.0, 15913.0, 10544.0, 6800.0, 4335.0, 2758.0, 1802.0, 1187.0, 685.0, 398.0, 289.0, 202.0, 126.0, 79.0, 50.0, 39.0, 27.0, 16.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.546875, -15.052001953125, -14.55712890625, -14.062255859375, -13.5673828125, -13.072509765625, -12.57763671875, -12.082763671875, -11.587890625, -11.093017578125, -10.59814453125, -10.103271484375, -9.6083984375, -9.113525390625, -8.61865234375, -8.123779296875, -7.62890625, -7.134033203125, -6.63916015625, -6.144287109375, -5.6494140625, -5.154541015625, -4.65966796875, -4.164794921875, -3.669921875, -3.175048828125, -2.68017578125, -2.185302734375, -1.6904296875, -1.195556640625, -0.70068359375, -0.205810546875, 0.2890625, 0.783935546875, 1.27880859375, 1.773681640625, 2.2685546875, 2.763427734375, 3.25830078125, 3.753173828125, 4.248046875, 4.742919921875, 5.23779296875, 5.732666015625, 6.2275390625, 6.722412109375, 7.21728515625, 7.712158203125, 8.20703125, 8.701904296875, 9.19677734375, 9.691650390625, 10.1865234375, 10.681396484375, 11.17626953125, 11.671142578125, 12.166015625, 12.660888671875, 13.15576171875, 13.650634765625, 14.1455078125, 14.640380859375, 15.13525390625, 15.630126953125, 16.125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 10.0, 3.0, 7.0, 3.0, 13.0, 10.0, 11.0, 10.0, 22.0, 21.0, 22.0, 26.0, 33.0, 33.0, 37.0, 44.0, 37.0, 34.0, 44.0, 37.0, 39.0, 49.0, 38.0, 42.0, 50.0, 39.0, 45.0, 28.0, 34.0, 28.0, 23.0, 22.0, 23.0, 13.0, 6.0, 14.0, 16.0, 11.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0020885467529296875, -0.002025127410888672, -0.0019617080688476562, -0.0018982887268066406, -0.001834869384765625, -0.0017714500427246094, -0.0017080307006835938, -0.0016446113586425781, -0.0015811920166015625, -0.0015177726745605469, -0.0014543533325195312, -0.0013909339904785156, -0.0013275146484375, -0.0012640953063964844, -0.0012006759643554688, -0.0011372566223144531, -0.0010738372802734375, -0.0010104179382324219, -0.0009469985961914062, -0.0008835792541503906, -0.000820159912109375, -0.0007567405700683594, -0.0006933212280273438, -0.0006299018859863281, -0.0005664825439453125, -0.0005030632019042969, -0.00043964385986328125, -0.0003762245178222656, -0.00031280517578125, -0.0002493858337402344, -0.00018596649169921875, -0.00012254714965820312, -5.91278076171875e-05, 4.291534423828125e-06, 6.771087646484375e-05, 0.00013113021850585938, 0.000194549560546875, 0.0002579689025878906, 0.00032138824462890625, 0.0003848075866699219, 0.0004482269287109375, 0.0005116462707519531, 0.0005750656127929688, 0.0006384849548339844, 0.000701904296875, 0.0007653236389160156, 0.0008287429809570312, 0.0008921623229980469, 0.0009555816650390625, 0.0010190010070800781, 0.0010824203491210938, 0.0011458396911621094, 0.001209259033203125, 0.0012726783752441406, 0.0013360977172851562, 0.0013995170593261719, 0.0014629364013671875, 0.0015263557434082031, 0.0015897750854492188, 0.0016531944274902344, 0.00171661376953125, 0.0017800331115722656, 0.0018434524536132812, 0.0019068717956542969, 0.0019702911376953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 8.0, 25.0, 43.0, 58.0, 84.0, 156.0, 269.0, 397.0, 692.0, 1048.0, 1642.0, 2656.0, 4294.0, 6642.0, 10369.0, 15784.0, 23907.0, 35077.0, 48876.0, 65059.0, 81997.0, 97103.0, 106551.0, 108292.0, 101046.0, 88325.0, 72140.0, 55019.0, 40034.0, 28203.0, 18901.0, 12270.0, 8023.0, 5202.0, 3163.0, 1971.0, 1233.0, 734.0, 496.0, 306.0, 168.0, 94.0, 76.0, 46.0, 30.0, 19.0, 8.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0], "bins": [-20.65625, -20.05224609375, -19.4482421875, -18.84423828125, -18.240234375, -17.63623046875, -17.0322265625, -16.42822265625, -15.82421875, -15.22021484375, -14.6162109375, -14.01220703125, -13.408203125, -12.80419921875, -12.2001953125, -11.59619140625, -10.9921875, -10.38818359375, -9.7841796875, -9.18017578125, -8.576171875, -7.97216796875, -7.3681640625, -6.76416015625, -6.16015625, -5.55615234375, -4.9521484375, -4.34814453125, -3.744140625, -3.14013671875, -2.5361328125, -1.93212890625, -1.328125, -0.72412109375, -0.1201171875, 0.48388671875, 1.087890625, 1.69189453125, 2.2958984375, 2.89990234375, 3.50390625, 4.10791015625, 4.7119140625, 5.31591796875, 5.919921875, 6.52392578125, 7.1279296875, 7.73193359375, 8.3359375, 8.93994140625, 9.5439453125, 10.14794921875, 10.751953125, 11.35595703125, 11.9599609375, 12.56396484375, 13.16796875, 13.77197265625, 14.3759765625, 14.97998046875, 15.583984375, 16.18798828125, 16.7919921875, 17.39599609375, 18.0]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 8.0, 2.0, 6.0, 12.0, 7.0, 10.0, 14.0, 12.0, 22.0, 16.0, 31.0, 27.0, 18.0, 20.0, 36.0, 29.0, 37.0, 37.0, 40.0, 50.0, 47.0, 51.0, 40.0, 27.0, 39.0, 47.0, 42.0, 34.0, 37.0, 28.0, 22.0, 23.0, 20.0, 22.0, 14.0, 19.0, 15.0, 9.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.8671875, -7.6195068359375, -7.371826171875, -7.1241455078125, -6.87646484375, -6.6287841796875, -6.381103515625, -6.1334228515625, -5.8857421875, -5.6380615234375, -5.390380859375, -5.1427001953125, -4.89501953125, -4.6473388671875, -4.399658203125, -4.1519775390625, -3.904296875, -3.6566162109375, -3.408935546875, -3.1612548828125, -2.91357421875, -2.6658935546875, -2.418212890625, -2.1705322265625, -1.9228515625, -1.6751708984375, -1.427490234375, -1.1798095703125, -0.93212890625, -0.6844482421875, -0.436767578125, -0.1890869140625, 0.05859375, 0.3062744140625, 0.553955078125, 0.8016357421875, 1.04931640625, 1.2969970703125, 1.544677734375, 1.7923583984375, 2.0400390625, 2.2877197265625, 2.535400390625, 2.7830810546875, 3.03076171875, 3.2784423828125, 3.526123046875, 3.7738037109375, 4.021484375, 4.2691650390625, 4.516845703125, 4.7645263671875, 5.01220703125, 5.2598876953125, 5.507568359375, 5.7552490234375, 6.0029296875, 6.2506103515625, 6.498291015625, 6.7459716796875, 6.99365234375, 7.2413330078125, 7.489013671875, 7.7366943359375, 7.984375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 5.0, 14.0, 6.0, 11.0, 12.0, 16.0, 22.0, 12.0, 18.0, 24.0, 31.0, 25.0, 27.0, 35.0, 38.0, 30.0, 49.0, 42.0, 43.0, 53.0, 47.0, 35.0, 35.0, 42.0, 31.0, 33.0, 30.0, 27.0, 24.0, 29.0, 27.0, 22.0, 15.0, 14.0, 19.0, 3.0, 13.0, 8.0, 4.0, 8.0, 6.0, 7.0, 3.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.916141510009766, -59.020442962646484, -57.12474060058594, -55.229042053222656, -53.333343505859375, -51.437644958496094, -49.54194259643555, -47.646244049072266, -45.75054168701172, -43.85484313964844, -41.95914077758789, -40.06344223022461, -38.16774368286133, -36.27204132080078, -34.3763427734375, -32.48064422607422, -30.584945678710938, -28.689245223999023, -26.793546676635742, -24.897846221923828, -23.002147674560547, -21.106447219848633, -19.21074676513672, -17.315048217773438, -15.419347763061523, -13.523648262023926, -11.627948760986328, -9.732248306274414, -7.836548805236816, -5.940849304199219, -4.045148849487305, -2.149449348449707, -0.25374603271484375, 1.641953706741333, 3.5376534461975098, 5.433353424072266, 7.329052925109863, 9.224752426147461, 11.120452880859375, 13.016152381896973, 14.91185188293457, 16.807552337646484, 18.703250885009766, 20.59895133972168, 22.494651794433594, 24.390350341796875, 26.28605079650879, 28.181751251220703, 30.077449798583984, 31.9731502532959, 33.86885070800781, 35.764549255371094, 37.660247802734375, 39.555946350097656, 41.4516487121582, 43.347347259521484, 45.24304962158203, 47.13874816894531, 49.03445053100586, 50.93014907836914, 52.82584762573242, 54.72154998779297, 56.61724853515625, 58.51294708251953, 60.40864562988281]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 2.0, 5.0, 3.0, 7.0, 15.0, 10.0, 12.0, 18.0, 23.0, 21.0, 24.0, 28.0, 22.0, 29.0, 29.0, 27.0, 27.0, 30.0, 32.0, 36.0, 40.0, 45.0, 29.0, 32.0, 40.0, 28.0, 33.0, 42.0, 30.0, 38.0, 21.0, 27.0, 31.0, 29.0, 20.0, 24.0, 12.0, 14.0, 10.0, 6.0, 10.0, 6.0, 7.0, 7.0, 9.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.048343658447266, -52.148345947265625, -50.24835205078125, -48.34835433959961, -46.44835662841797, -44.548362731933594, -42.64836502075195, -40.74836730957031, -38.84837341308594, -36.9483757019043, -35.04838180541992, -33.14838409423828, -31.248388290405273, -29.348392486572266, -27.448394775390625, -25.548398971557617, -23.64840316772461, -21.7484073638916, -19.848411560058594, -17.948413848876953, -16.048418045043945, -14.148422241210938, -12.248425483703613, -10.348428726196289, -8.448432922363281, -6.548436641693115, -4.648440361022949, -2.748444080352783, -0.8484477996826172, 1.0515480041503906, 2.951544761657715, 4.851541519165039, 6.751533508300781, 8.651529312133789, 10.551526069641113, 12.451522827148438, 14.351518630981445, 16.251514434814453, 18.151512145996094, 20.0515079498291, 21.95150375366211, 23.851499557495117, 25.751495361328125, 27.651493072509766, 29.551488876342773, 31.45148468017578, 33.35148239135742, 35.25148010253906, 37.15147399902344, 39.05147171020508, 40.95146560668945, 42.851463317871094, 44.75145721435547, 46.65145492553711, 48.55145263671875, 50.451446533203125, 52.351444244384766, 54.251441955566406, 56.15143585205078, 58.05143356323242, 59.95143127441406, 61.85142517089844, 63.75142288208008, 65.65142059326172, 67.5514144897461]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 9.0, 17.0, 24.0, 33.0, 73.0, 118.0, 201.0, 353.0, 614.0, 970.0, 1711.0, 2653.0, 4267.0, 6951.0, 11057.0, 16992.0, 26008.0, 39481.0, 58360.0, 84901.0, 118129.0, 160822.0, 211544.0, 263590.0, 316971.0, 357499.0, 382161.0, 383733.0, 363903.0, 323348.0, 272912.0, 218901.0, 168699.0, 125246.0, 89028.0, 62778.0, 42033.0, 28081.0, 18458.0, 11850.0, 7437.0, 4745.0, 2932.0, 1778.0, 1114.0, 719.0, 422.0, 261.0, 147.0, 103.0, 62.0, 35.0, 25.0, 14.0, 5.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.75, -37.4619140625, -36.173828125, -34.8857421875, -33.59765625, -32.3095703125, -31.021484375, -29.7333984375, -28.4453125, -27.1572265625, -25.869140625, -24.5810546875, -23.29296875, -22.0048828125, -20.716796875, -19.4287109375, -18.140625, -16.8525390625, -15.564453125, -14.2763671875, -12.98828125, -11.7001953125, -10.412109375, -9.1240234375, -7.8359375, -6.5478515625, -5.259765625, -3.9716796875, -2.68359375, -1.3955078125, -0.107421875, 1.1806640625, 2.46875, 3.7568359375, 5.044921875, 6.3330078125, 7.62109375, 8.9091796875, 10.197265625, 11.4853515625, 12.7734375, 14.0615234375, 15.349609375, 16.6376953125, 17.92578125, 19.2138671875, 20.501953125, 21.7900390625, 23.078125, 24.3662109375, 25.654296875, 26.9423828125, 28.23046875, 29.5185546875, 30.806640625, 32.0947265625, 33.3828125, 34.6708984375, 35.958984375, 37.2470703125, 38.53515625, 39.8232421875, 41.111328125, 42.3994140625, 43.6875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 3.0, 9.0, 15.0, 9.0, 18.0, 17.0, 24.0, 20.0, 31.0, 25.0, 21.0, 30.0, 36.0, 24.0, 25.0, 34.0, 39.0, 32.0, 41.0, 42.0, 32.0, 40.0, 29.0, 31.0, 45.0, 29.0, 34.0, 33.0, 24.0, 25.0, 37.0, 19.0, 26.0, 11.0, 15.0, 11.0, 7.0, 9.0, 7.0, 8.0, 6.0, 6.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.46875, -46.72705078125, -44.9853515625, -43.24365234375, -41.501953125, -39.76025390625, -38.0185546875, -36.27685546875, -34.53515625, -32.79345703125, -31.0517578125, -29.31005859375, -27.568359375, -25.82666015625, -24.0849609375, -22.34326171875, -20.6015625, -18.85986328125, -17.1181640625, -15.37646484375, -13.634765625, -11.89306640625, -10.1513671875, -8.40966796875, -6.66796875, -4.92626953125, -3.1845703125, -1.44287109375, 0.298828125, 2.04052734375, 3.7822265625, 5.52392578125, 7.265625, 9.00732421875, 10.7490234375, 12.49072265625, 14.232421875, 15.97412109375, 17.7158203125, 19.45751953125, 21.19921875, 22.94091796875, 24.6826171875, 26.42431640625, 28.166015625, 29.90771484375, 31.6494140625, 33.39111328125, 35.1328125, 36.87451171875, 38.6162109375, 40.35791015625, 42.099609375, 43.84130859375, 45.5830078125, 47.32470703125, 49.06640625, 50.80810546875, 52.5498046875, 54.29150390625, 56.033203125, 57.77490234375, 59.5166015625, 61.25830078125, 63.0]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 8.0, 11.0, 28.0, 46.0, 84.0, 148.0, 252.0, 369.0, 622.0, 1061.0, 1709.0, 2756.0, 4360.0, 6850.0, 10948.0, 16603.0, 24801.0, 37314.0, 53669.0, 75767.0, 104097.0, 139289.0, 179036.0, 222311.0, 265658.0, 303367.0, 332588.0, 347208.0, 345121.0, 327577.0, 297288.0, 258002.0, 214419.0, 171073.0, 131602.0, 97494.0, 70836.0, 50413.0, 34444.0, 22847.0, 15467.0, 9894.0, 6457.0, 3948.0, 2520.0, 1557.0, 961.0, 572.0, 360.0, 192.0, 128.0, 70.0, 42.0, 27.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0], "bins": [-40.8125, -39.533203125, -38.25390625, -36.974609375, -35.6953125, -34.416015625, -33.13671875, -31.857421875, -30.578125, -29.298828125, -28.01953125, -26.740234375, -25.4609375, -24.181640625, -22.90234375, -21.623046875, -20.34375, -19.064453125, -17.78515625, -16.505859375, -15.2265625, -13.947265625, -12.66796875, -11.388671875, -10.109375, -8.830078125, -7.55078125, -6.271484375, -4.9921875, -3.712890625, -2.43359375, -1.154296875, 0.125, 1.404296875, 2.68359375, 3.962890625, 5.2421875, 6.521484375, 7.80078125, 9.080078125, 10.359375, 11.638671875, 12.91796875, 14.197265625, 15.4765625, 16.755859375, 18.03515625, 19.314453125, 20.59375, 21.873046875, 23.15234375, 24.431640625, 25.7109375, 26.990234375, 28.26953125, 29.548828125, 30.828125, 32.107421875, 33.38671875, 34.666015625, 35.9453125, 37.224609375, 38.50390625, 39.783203125, 41.0625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 12.0, 12.0, 11.0, 17.0, 26.0, 23.0, 33.0, 56.0, 48.0, 74.0, 77.0, 85.0, 110.0, 113.0, 125.0, 146.0, 139.0, 153.0, 152.0, 186.0, 182.0, 193.0, 180.0, 176.0, 162.0, 164.0, 178.0, 152.0, 133.0, 129.0, 115.0, 114.0, 96.0, 74.0, 82.0, 59.0, 44.0, 53.0, 41.0, 32.0, 35.0, 16.0, 15.0, 7.0, 7.0, 13.0, 7.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-24.59375, -23.836669921875, -23.07958984375, -22.322509765625, -21.5654296875, -20.808349609375, -20.05126953125, -19.294189453125, -18.537109375, -17.780029296875, -17.02294921875, -16.265869140625, -15.5087890625, -14.751708984375, -13.99462890625, -13.237548828125, -12.48046875, -11.723388671875, -10.96630859375, -10.209228515625, -9.4521484375, -8.695068359375, -7.93798828125, -7.180908203125, -6.423828125, -5.666748046875, -4.90966796875, -4.152587890625, -3.3955078125, -2.638427734375, -1.88134765625, -1.124267578125, -0.3671875, 0.389892578125, 1.14697265625, 1.904052734375, 2.6611328125, 3.418212890625, 4.17529296875, 4.932373046875, 5.689453125, 6.446533203125, 7.20361328125, 7.960693359375, 8.7177734375, 9.474853515625, 10.23193359375, 10.989013671875, 11.74609375, 12.503173828125, 13.26025390625, 14.017333984375, 14.7744140625, 15.531494140625, 16.28857421875, 17.045654296875, 17.802734375, 18.559814453125, 19.31689453125, 20.073974609375, 20.8310546875, 21.588134765625, 22.34521484375, 23.102294921875, 23.859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 7.0, 8.0, 17.0, 14.0, 16.0, 22.0, 21.0, 22.0, 31.0, 30.0, 36.0, 30.0, 30.0, 43.0, 43.0, 56.0, 48.0, 45.0, 35.0, 27.0, 38.0, 40.0, 32.0, 27.0, 37.0, 28.0, 23.0, 22.0, 25.0, 20.0, 14.0, 8.0, 10.0, 14.0, 12.0, 8.0, 12.0, 5.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.678443908691406, -55.83201599121094, -53.98558807373047, -52.13916015625, -50.29273223876953, -48.44630432128906, -46.599876403808594, -44.753448486328125, -42.907020568847656, -41.06059265136719, -39.21416473388672, -37.36773681640625, -35.52130889892578, -33.67488098144531, -31.828453063964844, -29.982025146484375, -28.135595321655273, -26.289167404174805, -24.442739486694336, -22.596311569213867, -20.7498836517334, -18.903453826904297, -17.057025909423828, -15.210598945617676, -13.364171028137207, -11.517743110656738, -9.67131519317627, -7.824886798858643, -5.978458881378174, -4.132030487060547, -2.285602569580078, -0.4391746520996094, 1.4072532653808594, 3.253681182861328, 5.100109100341797, 6.946537494659424, 8.792964935302734, 10.63939380645752, 12.485821723937988, 14.332249641418457, 16.17867660522461, 18.025104522705078, 19.871532440185547, 21.717960357666016, 23.564388275146484, 25.410816192626953, 27.257244110107422, 29.10367202758789, 30.950101852416992, 32.796531677246094, 34.64295959472656, 36.48938751220703, 38.3358154296875, 40.18224334716797, 42.02867126464844, 43.875099182128906, 45.721527099609375, 47.567955017089844, 49.41438293457031, 51.26081085205078, 53.10723876953125, 54.95366668701172, 56.80009460449219, 58.646522521972656, 60.492950439453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 8.0, 4.0, 13.0, 10.0, 13.0, 7.0, 16.0, 20.0, 13.0, 23.0, 22.0, 20.0, 22.0, 25.0, 24.0, 32.0, 26.0, 41.0, 35.0, 42.0, 32.0, 35.0, 41.0, 38.0, 43.0, 42.0, 32.0, 25.0, 32.0, 29.0, 20.0, 26.0, 23.0, 27.0, 21.0, 17.0, 11.0, 10.0, 13.0, 10.0, 11.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-55.211090087890625, -53.36396789550781, -51.516849517822266, -49.66972732543945, -47.822608947753906, -45.975486755371094, -44.12836456298828, -42.281246185302734, -40.43412780761719, -38.587005615234375, -36.73988723754883, -34.892765045166016, -33.04564666748047, -31.198524475097656, -29.351404190063477, -27.504283905029297, -25.657161712646484, -23.810041427612305, -21.962921142578125, -20.115798950195312, -18.268680572509766, -16.421558380126953, -14.574438095092773, -12.727317810058594, -10.880197525024414, -9.033077239990234, -7.1859564781188965, -5.338835716247559, -3.491715431213379, -1.6445951461791992, 0.20252609252929688, 2.0496463775634766, 3.8967628479003906, 5.74388313293457, 7.591003894805908, 9.438124656677246, 11.285244941711426, 13.132365226745605, 14.979486465454102, 16.82660675048828, 18.67372703552246, 20.52084732055664, 22.36796760559082, 24.215087890625, 26.062210083007812, 27.90932846069336, 29.756450653076172, 31.60357093811035, 33.45069122314453, 35.297813415527344, 37.14493179321289, 38.9920539855957, 40.83917236328125, 42.68629455566406, 44.533416748046875, 46.38053512573242, 48.22765350341797, 50.07477569580078, 51.92189407348633, 53.76901626586914, 55.61613464355469, 57.4632568359375, 59.31037902832031, 61.15749740600586, 63.00461959838867]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 8.0, 21.0, 26.0, 34.0, 57.0, 84.0, 158.0, 224.0, 367.0, 575.0, 908.0, 1398.0, 2225.0, 3475.0, 5626.0, 8444.0, 13188.0, 19503.0, 29327.0, 42111.0, 58614.0, 76939.0, 95321.0, 108730.0, 113762.0, 110012.0, 95378.0, 76982.0, 58046.0, 41855.0, 29095.0, 19587.0, 12955.0, 8494.0, 5497.0, 3491.0, 2183.0, 1426.0, 886.0, 530.0, 321.0, 246.0, 171.0, 97.0, 61.0, 42.0, 25.0, 18.0, 7.0, 12.0, 5.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.41015625, -8.125, -7.83984375, -7.5546875, -7.26953125, -6.984375, -6.69921875, -6.4140625, -6.12890625, -5.84375, -5.55859375, -5.2734375, -4.98828125, -4.703125, -4.41796875, -4.1328125, -3.84765625, -3.5625, -3.27734375, -2.9921875, -2.70703125, -2.421875, -2.13671875, -1.8515625, -1.56640625, -1.28125, -0.99609375, -0.7109375, -0.42578125, -0.140625, 0.14453125, 0.4296875, 0.71484375, 1.0, 1.28515625, 1.5703125, 1.85546875, 2.140625, 2.42578125, 2.7109375, 2.99609375, 3.28125, 3.56640625, 3.8515625, 4.13671875, 4.421875, 4.70703125, 4.9921875, 5.27734375, 5.5625, 5.84765625, 6.1328125, 6.41796875, 6.703125, 6.98828125, 7.2734375, 7.55859375, 7.84375, 8.12890625, 8.4140625, 8.69921875, 8.984375, 9.26953125, 9.5546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 4.0, 13.0, 11.0, 12.0, 8.0, 18.0, 16.0, 15.0, 23.0, 21.0, 21.0, 22.0, 26.0, 22.0, 30.0, 27.0, 41.0, 37.0, 42.0, 32.0, 37.0, 39.0, 38.0, 43.0, 41.0, 31.0, 27.0, 30.0, 29.0, 22.0, 26.0, 23.0, 27.0, 20.0, 16.0, 11.0, 12.0, 13.0, 11.0, 10.0, 7.0, 8.0, 2.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-55.5, -53.64990234375, -51.7998046875, -49.94970703125, -48.099609375, -46.24951171875, -44.3994140625, -42.54931640625, -40.69921875, -38.84912109375, -36.9990234375, -35.14892578125, -33.298828125, -31.44873046875, -29.5986328125, -27.74853515625, -25.8984375, -24.04833984375, -22.1982421875, -20.34814453125, -18.498046875, -16.64794921875, -14.7978515625, -12.94775390625, -11.09765625, -9.24755859375, -7.3974609375, -5.54736328125, -3.697265625, -1.84716796875, 0.0029296875, 1.85302734375, 3.703125, 5.55322265625, 7.4033203125, 9.25341796875, 11.103515625, 12.95361328125, 14.8037109375, 16.65380859375, 18.50390625, 20.35400390625, 22.2041015625, 24.05419921875, 25.904296875, 27.75439453125, 29.6044921875, 31.45458984375, 33.3046875, 35.15478515625, 37.0048828125, 38.85498046875, 40.705078125, 42.55517578125, 44.4052734375, 46.25537109375, 48.10546875, 49.95556640625, 51.8056640625, 53.65576171875, 55.505859375, 57.35595703125, 59.2060546875, 61.05615234375, 62.90625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 12.0, 18.0, 26.0, 47.0, 72.0, 123.0, 184.0, 308.0, 486.0, 825.0, 1305.0, 2129.0, 3541.0, 5729.0, 9385.0, 15718.0, 28512.0, 188235.0, 705318.0, 38353.0, 19296.0, 11278.0, 6842.0, 4320.0, 2490.0, 1583.0, 906.0, 611.0, 346.0, 208.0, 124.0, 90.0, 40.0, 36.0, 17.0, 10.0, 11.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.3125, -25.46875, -24.625, -23.78125, -22.9375, -22.09375, -21.25, -20.40625, -19.5625, -18.71875, -17.875, -17.03125, -16.1875, -15.34375, -14.5, -13.65625, -12.8125, -11.96875, -11.125, -10.28125, -9.4375, -8.59375, -7.75, -6.90625, -6.0625, -5.21875, -4.375, -3.53125, -2.6875, -1.84375, -1.0, -0.15625, 0.6875, 1.53125, 2.375, 3.21875, 4.0625, 4.90625, 5.75, 6.59375, 7.4375, 8.28125, 9.125, 9.96875, 10.8125, 11.65625, 12.5, 13.34375, 14.1875, 15.03125, 15.875, 16.71875, 17.5625, 18.40625, 19.25, 20.09375, 20.9375, 21.78125, 22.625, 23.46875, 24.3125, 25.15625, 26.0, 26.84375, 27.6875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 15.0, 16.0, 8.0, 15.0, 20.0, 17.0, 27.0, 27.0, 28.0, 16.0, 28.0, 29.0, 37.0, 33.0, 42.0, 52.0, 35.0, 37.0, 48.0, 42.0, 38.0, 38.0, 32.0, 24.0, 27.0, 30.0, 34.0, 29.0, 16.0, 28.0, 12.0, 19.0, 22.0, 12.0, 12.0, 6.0, 7.0, 7.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.5, -41.146484375, -39.79296875, -38.439453125, -37.0859375, -35.732421875, -34.37890625, -33.025390625, -31.671875, -30.318359375, -28.96484375, -27.611328125, -26.2578125, -24.904296875, -23.55078125, -22.197265625, -20.84375, -19.490234375, -18.13671875, -16.783203125, -15.4296875, -14.076171875, -12.72265625, -11.369140625, -10.015625, -8.662109375, -7.30859375, -5.955078125, -4.6015625, -3.248046875, -1.89453125, -0.541015625, 0.8125, 2.166015625, 3.51953125, 4.873046875, 6.2265625, 7.580078125, 8.93359375, 10.287109375, 11.640625, 12.994140625, 14.34765625, 15.701171875, 17.0546875, 18.408203125, 19.76171875, 21.115234375, 22.46875, 23.822265625, 25.17578125, 26.529296875, 27.8828125, 29.236328125, 30.58984375, 31.943359375, 33.296875, 34.650390625, 36.00390625, 37.357421875, 38.7109375, 40.064453125, 41.41796875, 42.771484375, 44.125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 10.0, 7.0, 14.0, 20.0, 20.0, 41.0, 52.0, 83.0, 143.0, 242.0, 376.0, 639.0, 1045.0, 1909.0, 3189.0, 5542.0, 10340.0, 19016.0, 38119.0, 810029.0, 99065.0, 26876.0, 14119.0, 7556.0, 4256.0, 2315.0, 1404.0, 823.0, 481.0, 306.0, 197.0, 102.0, 70.0, 43.0, 32.0, 29.0, 7.0, 7.0, 15.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.09765625, -3.003082275390625, -2.90850830078125, -2.813934326171875, -2.7193603515625, -2.624786376953125, -2.53021240234375, -2.435638427734375, -2.341064453125, -2.246490478515625, -2.15191650390625, -2.057342529296875, -1.9627685546875, -1.868194580078125, -1.77362060546875, -1.679046630859375, -1.58447265625, -1.489898681640625, -1.39532470703125, -1.300750732421875, -1.2061767578125, -1.111602783203125, -1.01702880859375, -0.922454833984375, -0.827880859375, -0.733306884765625, -0.63873291015625, -0.544158935546875, -0.4495849609375, -0.355010986328125, -0.26043701171875, -0.165863037109375, -0.0712890625, 0.023284912109375, 0.11785888671875, 0.212432861328125, 0.3070068359375, 0.401580810546875, 0.49615478515625, 0.590728759765625, 0.685302734375, 0.779876708984375, 0.87445068359375, 0.969024658203125, 1.0635986328125, 1.158172607421875, 1.25274658203125, 1.347320556640625, 1.44189453125, 1.536468505859375, 1.63104248046875, 1.725616455078125, 1.8201904296875, 1.914764404296875, 2.00933837890625, 2.103912353515625, 2.198486328125, 2.293060302734375, 2.38763427734375, 2.482208251953125, 2.5767822265625, 2.671356201171875, 2.76593017578125, 2.860504150390625, 2.955078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 13.0, 13.0, 10.0, 17.0, 24.0, 28.0, 27.0, 35.0, 28.0, 53.0, 39.0, 44.0, 53.0, 38.0, 50.0, 46.0, 57.0, 49.0, 56.0, 42.0, 31.0, 43.0, 16.0, 35.0, 27.0, 19.0, 23.0, 18.0, 14.0, 11.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.18832015991211e-05, -6.942730396986008e-05, -6.697140634059906e-05, -6.451550871133804e-05, -6.205961108207703e-05, -5.960371345281601e-05, -5.714781582355499e-05, -5.4691918194293976e-05, -5.223602056503296e-05, -4.978012293577194e-05, -4.7324225306510925e-05, -4.486832767724991e-05, -4.241243004798889e-05, -3.9956532418727875e-05, -3.750063478946686e-05, -3.504473716020584e-05, -3.2588839530944824e-05, -3.0132941901683807e-05, -2.767704427242279e-05, -2.5221146643161774e-05, -2.2765249013900757e-05, -2.030935138463974e-05, -1.7853453755378723e-05, -1.5397556126117706e-05, -1.294165849685669e-05, -1.0485760867595673e-05, -8.029863238334656e-06, -5.573965609073639e-06, -3.118067979812622e-06, -6.621703505516052e-07, 1.7937272787094116e-06, 4.2496249079704285e-06, 6.705522537231445e-06, 9.161420166492462e-06, 1.1617317795753479e-05, 1.4073215425014496e-05, 1.6529113054275513e-05, 1.898501068353653e-05, 2.1440908312797546e-05, 2.3896805942058563e-05, 2.635270357131958e-05, 2.8808601200580597e-05, 3.1264498829841614e-05, 3.372039645910263e-05, 3.617629408836365e-05, 3.8632191717624664e-05, 4.108808934688568e-05, 4.35439869761467e-05, 4.5999884605407715e-05, 4.845578223466873e-05, 5.091167986392975e-05, 5.3367577493190765e-05, 5.582347512245178e-05, 5.82793727517128e-05, 6.0735270380973816e-05, 6.319116801023483e-05, 6.564706563949585e-05, 6.810296326875687e-05, 7.055886089801788e-05, 7.30147585272789e-05, 7.547065615653992e-05, 7.792655378580093e-05, 8.038245141506195e-05, 8.283834904432297e-05, 8.529424667358398e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 13.0, 13.0, 13.0, 18.0, 33.0, 54.0, 77.0, 104.0, 150.0, 253.0, 367.0, 536.0, 858.0, 1191.0, 1768.0, 2835.0, 4035.0, 5958.0, 8636.0, 12688.0, 18162.0, 26145.0, 36278.0, 49491.0, 66957.0, 87508.0, 107380.0, 120014.0, 116103.0, 98612.0, 77811.0, 59087.0, 42981.0, 31210.0, 22032.0, 15446.0, 10753.0, 7575.0, 5203.0, 3440.0, 2262.0, 1436.0, 1032.0, 702.0, 441.0, 294.0, 216.0, 142.0, 86.0, 57.0, 30.0, 24.0, 15.0, 19.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.9775390625, -1.9132843017578125, -1.849029541015625, -1.7847747802734375, -1.72052001953125, -1.6562652587890625, -1.592010498046875, -1.5277557373046875, -1.4635009765625, -1.3992462158203125, -1.334991455078125, -1.2707366943359375, -1.20648193359375, -1.1422271728515625, -1.077972412109375, -1.0137176513671875, -0.949462890625, -0.8852081298828125, -0.820953369140625, -0.7566986083984375, -0.69244384765625, -0.6281890869140625, -0.563934326171875, -0.4996795654296875, -0.4354248046875, -0.3711700439453125, -0.306915283203125, -0.2426605224609375, -0.17840576171875, -0.1141510009765625, -0.049896240234375, 0.0143585205078125, 0.07861328125, 0.1428680419921875, 0.207122802734375, 0.2713775634765625, 0.33563232421875, 0.3998870849609375, 0.464141845703125, 0.5283966064453125, 0.5926513671875, 0.6569061279296875, 0.721160888671875, 0.7854156494140625, 0.84967041015625, 0.9139251708984375, 0.978179931640625, 1.0424346923828125, 1.106689453125, 1.1709442138671875, 1.235198974609375, 1.2994537353515625, 1.36370849609375, 1.4279632568359375, 1.492218017578125, 1.5564727783203125, 1.6207275390625, 1.6849822998046875, 1.749237060546875, 1.8134918212890625, 1.87774658203125, 1.9420013427734375, 2.006256103515625, 2.0705108642578125, 2.134765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 9.0, 14.0, 21.0, 16.0, 16.0, 22.0, 30.0, 29.0, 32.0, 41.0, 55.0, 53.0, 55.0, 66.0, 73.0, 70.0, 47.0, 50.0, 42.0, 38.0, 38.0, 18.0, 25.0, 18.0, 11.0, 15.0, 15.0, 14.0, 5.0, 13.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.2724609375, -1.2373580932617188, -1.2022552490234375, -1.1671524047851562, -1.132049560546875, -1.0969467163085938, -1.0618438720703125, -1.0267410278320312, -0.99163818359375, -0.9565353393554688, -0.9214324951171875, -0.8863296508789062, -0.851226806640625, -0.8161239624023438, -0.7810211181640625, -0.7459182739257812, -0.7108154296875, -0.6757125854492188, -0.6406097412109375, -0.6055068969726562, -0.570404052734375, -0.5353012084960938, -0.5001983642578125, -0.46509552001953125, -0.42999267578125, -0.39488983154296875, -0.3597869873046875, -0.32468414306640625, -0.289581298828125, -0.25447845458984375, -0.2193756103515625, -0.18427276611328125, -0.149169921875, -0.11406707763671875, -0.0789642333984375, -0.04386138916015625, -0.008758544921875, 0.02634429931640625, 0.0614471435546875, 0.09654998779296875, 0.13165283203125, 0.16675567626953125, 0.2018585205078125, 0.23696136474609375, 0.272064208984375, 0.30716705322265625, 0.3422698974609375, 0.37737274169921875, 0.4124755859375, 0.44757843017578125, 0.4826812744140625, 0.5177841186523438, 0.552886962890625, 0.5879898071289062, 0.6230926513671875, 0.6581954956054688, 0.69329833984375, 0.7284011840820312, 0.7635040283203125, 0.7986068725585938, 0.833709716796875, 0.8688125610351562, 0.9039154052734375, 0.9390182495117188, 0.97412109375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 11.0, 5.0, 14.0, 14.0, 14.0, 16.0, 32.0, 17.0, 22.0, 39.0, 21.0, 33.0, 28.0, 36.0, 44.0, 46.0, 53.0, 44.0, 40.0, 40.0, 23.0, 33.0, 46.0, 31.0, 34.0, 28.0, 26.0, 20.0, 27.0, 21.0, 20.0, 14.0, 11.0, 12.0, 12.0, 9.0, 11.0, 10.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.98395538330078, -54.17173767089844, -52.359519958496094, -50.54730224609375, -48.73508834838867, -46.92287063598633, -45.110652923583984, -43.29843521118164, -41.48622131347656, -39.67400360107422, -37.861785888671875, -36.04956817626953, -34.23735427856445, -32.42513656616211, -30.612918853759766, -28.800701141357422, -26.988483428955078, -25.176265716552734, -23.364049911499023, -21.55183219909668, -19.73961639404297, -17.927398681640625, -16.11518096923828, -14.302964210510254, -12.490747451782227, -10.6785306930542, -8.866313934326172, -7.054096221923828, -5.241879463195801, -3.4296627044677734, -1.6174449920654297, 0.19477176666259766, 2.0069847106933594, 3.819201707839966, 5.631418704986572, 7.443635940551758, 9.255852699279785, 11.068069458007812, 12.880287170410156, 14.692503929138184, 16.50472068786621, 18.316938400268555, 20.129154205322266, 21.94137191772461, 23.753589630126953, 25.565805435180664, 27.378023147583008, 29.19023895263672, 31.002456665039062, 32.814674377441406, 34.62689208984375, 36.439109802246094, 38.25132369995117, 40.063541412353516, 41.87575912475586, 43.6879768371582, 45.50019073486328, 47.312408447265625, 49.12462615966797, 50.93684387207031, 52.74905776977539, 54.561275482177734, 56.37349319458008, 58.18571090698242, 59.997928619384766]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 4.0, 14.0, 13.0, 10.0, 11.0, 18.0, 13.0, 18.0, 22.0, 20.0, 21.0, 21.0, 26.0, 25.0, 31.0, 29.0, 38.0, 36.0, 47.0, 31.0, 33.0, 43.0, 39.0, 42.0, 38.0, 30.0, 28.0, 30.0, 32.0, 17.0, 28.0, 21.0, 28.0, 20.0, 14.0, 10.0, 10.0, 17.0, 12.0, 7.0, 9.0, 7.0, 2.0, 5.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-55.297603607177734, -53.44639205932617, -51.59518051147461, -49.74396896362305, -47.892757415771484, -46.04154586791992, -44.19033432006836, -42.3391227722168, -40.487911224365234, -38.63669967651367, -36.78548812866211, -34.93427658081055, -33.083065032958984, -31.231853485107422, -29.38064193725586, -27.529430389404297, -25.6782169342041, -23.82700538635254, -21.975793838500977, -20.124582290649414, -18.27337074279785, -16.422157287597656, -14.57094669342041, -12.719735145568848, -10.868523597717285, -9.017312049865723, -7.16610050201416, -5.3148884773254395, -3.463676929473877, -1.6124649047851562, 0.23874664306640625, 2.0899581909179688, 3.9411697387695312, 5.792381286621094, 7.643592834472656, 9.494804382324219, 11.346015930175781, 13.19722843170166, 15.048439979553223, 16.89965057373047, 18.75086212158203, 20.602073669433594, 22.453285217285156, 24.30449676513672, 26.15570831298828, 28.006919860839844, 29.858131408691406, 31.70934295654297, 33.56055450439453, 35.411766052246094, 37.262977600097656, 39.11418914794922, 40.96540069580078, 42.816612243652344, 44.667823791503906, 46.51903533935547, 48.3702507019043, 50.22146224975586, 52.07267379760742, 53.923885345458984, 55.77509689331055, 57.62630844116211, 59.47751998901367, 61.328731536865234, 63.1799430847168]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 13.0, 27.0, 32.0, 55.0, 93.0, 219.0, 285.0, 472.0, 765.0, 1171.0, 1894.0, 3047.0, 4525.0, 6671.0, 9830.0, 14092.0, 19649.0, 26839.0, 35505.0, 45629.0, 55900.0, 66583.0, 75422.0, 82225.0, 85696.0, 85174.0, 80537.0, 73010.0, 62959.0, 53357.0, 42916.0, 32958.0, 24469.0, 17951.0, 12818.0, 8650.0, 5938.0, 4074.0, 2626.0, 1605.0, 1089.0, 690.0, 436.0, 251.0, 163.0, 103.0, 56.0, 35.0, 20.0, 12.0, 8.0, 5.0, 5.0, 0.0, 1.0], "bins": [-36.75, -35.66455078125, -34.5791015625, -33.49365234375, -32.408203125, -31.32275390625, -30.2373046875, -29.15185546875, -28.06640625, -26.98095703125, -25.8955078125, -24.81005859375, -23.724609375, -22.63916015625, -21.5537109375, -20.46826171875, -19.3828125, -18.29736328125, -17.2119140625, -16.12646484375, -15.041015625, -13.95556640625, -12.8701171875, -11.78466796875, -10.69921875, -9.61376953125, -8.5283203125, -7.44287109375, -6.357421875, -5.27197265625, -4.1865234375, -3.10107421875, -2.015625, -0.93017578125, 0.1552734375, 1.24072265625, 2.326171875, 3.41162109375, 4.4970703125, 5.58251953125, 6.66796875, 7.75341796875, 8.8388671875, 9.92431640625, 11.009765625, 12.09521484375, 13.1806640625, 14.26611328125, 15.3515625, 16.43701171875, 17.5224609375, 18.60791015625, 19.693359375, 20.77880859375, 21.8642578125, 22.94970703125, 24.03515625, 25.12060546875, 26.2060546875, 27.29150390625, 28.376953125, 29.46240234375, 30.5478515625, 31.63330078125, 32.71875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 5.0, 11.0, 12.0, 12.0, 11.0, 16.0, 18.0, 15.0, 23.0, 21.0, 18.0, 22.0, 29.0, 23.0, 33.0, 29.0, 42.0, 37.0, 45.0, 32.0, 29.0, 52.0, 40.0, 40.0, 38.0, 27.0, 28.0, 33.0, 25.0, 19.0, 30.0, 22.0, 28.0, 15.0, 19.0, 5.0, 14.0, 14.0, 11.0, 6.0, 10.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-54.0, -52.18017578125, -50.3603515625, -48.54052734375, -46.720703125, -44.90087890625, -43.0810546875, -41.26123046875, -39.44140625, -37.62158203125, -35.8017578125, -33.98193359375, -32.162109375, -30.34228515625, -28.5224609375, -26.70263671875, -24.8828125, -23.06298828125, -21.2431640625, -19.42333984375, -17.603515625, -15.78369140625, -13.9638671875, -12.14404296875, -10.32421875, -8.50439453125, -6.6845703125, -4.86474609375, -3.044921875, -1.22509765625, 0.5947265625, 2.41455078125, 4.234375, 6.05419921875, 7.8740234375, 9.69384765625, 11.513671875, 13.33349609375, 15.1533203125, 16.97314453125, 18.79296875, 20.61279296875, 22.4326171875, 24.25244140625, 26.072265625, 27.89208984375, 29.7119140625, 31.53173828125, 33.3515625, 35.17138671875, 36.9912109375, 38.81103515625, 40.630859375, 42.45068359375, 44.2705078125, 46.09033203125, 47.91015625, 49.72998046875, 51.5498046875, 53.36962890625, 55.189453125, 57.00927734375, 58.8291015625, 60.64892578125, 62.46875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 14.0, 35.0, 47.0, 81.0, 135.0, 224.0, 350.0, 651.0, 1031.0, 1714.0, 2573.0, 4155.0, 6501.0, 9964.0, 14671.0, 21252.0, 29661.0, 39735.0, 51688.0, 64677.0, 76011.0, 86322.0, 91937.0, 92887.0, 88995.0, 81114.0, 69824.0, 57813.0, 45097.0, 34303.0, 24710.0, 17287.0, 11783.0, 7862.0, 5058.0, 3211.0, 1988.0, 1245.0, 807.0, 464.0, 260.0, 179.0, 104.0, 51.0, 46.0, 23.0, 12.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.0, -32.875, -31.75, -30.625, -29.5, -28.375, -27.25, -26.125, -25.0, -23.875, -22.75, -21.625, -20.5, -19.375, -18.25, -17.125, -16.0, -14.875, -13.75, -12.625, -11.5, -10.375, -9.25, -8.125, -7.0, -5.875, -4.75, -3.625, -2.5, -1.375, -0.25, 0.875, 2.0, 3.125, 4.25, 5.375, 6.5, 7.625, 8.75, 9.875, 11.0, 12.125, 13.25, 14.375, 15.5, 16.625, 17.75, 18.875, 20.0, 21.125, 22.25, 23.375, 24.5, 25.625, 26.75, 27.875, 29.0, 30.125, 31.25, 32.375, 33.5, 34.625, 35.75, 36.875, 38.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 3.0, 6.0, 5.0, 5.0, 11.0, 7.0, 16.0, 17.0, 18.0, 18.0, 16.0, 21.0, 27.0, 24.0, 31.0, 34.0, 43.0, 34.0, 35.0, 46.0, 40.0, 41.0, 42.0, 52.0, 51.0, 41.0, 33.0, 29.0, 39.0, 33.0, 22.0, 28.0, 16.0, 19.0, 16.0, 10.0, 5.0, 6.0, 13.0, 10.0, 9.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.6875, -39.34912109375, -38.0107421875, -36.67236328125, -35.333984375, -33.99560546875, -32.6572265625, -31.31884765625, -29.98046875, -28.64208984375, -27.3037109375, -25.96533203125, -24.626953125, -23.28857421875, -21.9501953125, -20.61181640625, -19.2734375, -17.93505859375, -16.5966796875, -15.25830078125, -13.919921875, -12.58154296875, -11.2431640625, -9.90478515625, -8.56640625, -7.22802734375, -5.8896484375, -4.55126953125, -3.212890625, -1.87451171875, -0.5361328125, 0.80224609375, 2.140625, 3.47900390625, 4.8173828125, 6.15576171875, 7.494140625, 8.83251953125, 10.1708984375, 11.50927734375, 12.84765625, 14.18603515625, 15.5244140625, 16.86279296875, 18.201171875, 19.53955078125, 20.8779296875, 22.21630859375, 23.5546875, 24.89306640625, 26.2314453125, 27.56982421875, 28.908203125, 30.24658203125, 31.5849609375, 32.92333984375, 34.26171875, 35.60009765625, 36.9384765625, 38.27685546875, 39.615234375, 40.95361328125, 42.2919921875, 43.63037109375, 44.96875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 14.0, 28.0, 36.0, 67.0, 122.0, 181.0, 338.0, 597.0, 1064.0, 1823.0, 3356.0, 5640.0, 9884.0, 16485.0, 26135.0, 40032.0, 58425.0, 79126.0, 98928.0, 114498.0, 120140.0, 115759.0, 100933.0, 81593.0, 60842.0, 42756.0, 27630.0, 17240.0, 10482.0, 6113.0, 3592.0, 1952.0, 1201.0, 684.0, 362.0, 190.0, 126.0, 75.0, 42.0, 29.0, 16.0, 9.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.139404296875, -18.51318359375, -17.886962890625, -17.2607421875, -16.634521484375, -16.00830078125, -15.382080078125, -14.755859375, -14.129638671875, -13.50341796875, -12.877197265625, -12.2509765625, -11.624755859375, -10.99853515625, -10.372314453125, -9.74609375, -9.119873046875, -8.49365234375, -7.867431640625, -7.2412109375, -6.614990234375, -5.98876953125, -5.362548828125, -4.736328125, -4.110107421875, -3.48388671875, -2.857666015625, -2.2314453125, -1.605224609375, -0.97900390625, -0.352783203125, 0.2734375, 0.899658203125, 1.52587890625, 2.152099609375, 2.7783203125, 3.404541015625, 4.03076171875, 4.656982421875, 5.283203125, 5.909423828125, 6.53564453125, 7.161865234375, 7.7880859375, 8.414306640625, 9.04052734375, 9.666748046875, 10.29296875, 10.919189453125, 11.54541015625, 12.171630859375, 12.7978515625, 13.424072265625, 14.05029296875, 14.676513671875, 15.302734375, 15.928955078125, 16.55517578125, 17.181396484375, 17.8076171875, 18.433837890625, 19.06005859375, 19.686279296875, 20.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 11.0, 18.0, 11.0, 16.0, 23.0, 21.0, 29.0, 32.0, 34.0, 40.0, 40.0, 59.0, 43.0, 60.0, 52.0, 58.0, 45.0, 56.0, 54.0, 44.0, 46.0, 35.0, 28.0, 32.0, 23.0, 12.0, 23.0, 12.0, 14.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023040771484375, -0.0022216439247131348, -0.0021392107009887695, -0.0020567774772644043, -0.001974344253540039, -0.0018919110298156738, -0.0018094778060913086, -0.0017270445823669434, -0.0016446113586425781, -0.0015621781349182129, -0.0014797449111938477, -0.0013973116874694824, -0.0013148784637451172, -0.001232445240020752, -0.0011500120162963867, -0.0010675787925720215, -0.0009851455688476562, -0.000902712345123291, -0.0008202791213989258, -0.0007378458976745605, -0.0006554126739501953, -0.0005729794502258301, -0.0004905462265014648, -0.0004081130027770996, -0.0003256797790527344, -0.00024324655532836914, -0.0001608133316040039, -7.838010787963867e-05, 4.0531158447265625e-06, 8.64863395690918e-05, 0.00016891956329345703, 0.00025135278701782227, 0.0003337860107421875, 0.00041621923446655273, 0.000498652458190918, 0.0005810856819152832, 0.0006635189056396484, 0.0007459521293640137, 0.0008283853530883789, 0.0009108185768127441, 0.0009932518005371094, 0.0010756850242614746, 0.0011581182479858398, 0.001240551471710205, 0.0013229846954345703, 0.0014054179191589355, 0.0014878511428833008, 0.001570284366607666, 0.0016527175903320312, 0.0017351508140563965, 0.0018175840377807617, 0.001900017261505127, 0.001982450485229492, 0.0020648837089538574, 0.0021473169326782227, 0.002229750156402588, 0.002312183380126953, 0.0023946166038513184, 0.0024770498275756836, 0.002559483051300049, 0.002641916275024414, 0.0027243494987487793, 0.0028067827224731445, 0.0028892159461975098, 0.002971649169921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 14.0, 12.0, 19.0, 35.0, 73.0, 106.0, 155.0, 297.0, 477.0, 818.0, 1395.0, 2105.0, 3429.0, 5541.0, 8760.0, 13368.0, 20435.0, 29650.0, 41667.0, 56821.0, 71856.0, 87974.0, 99269.0, 105014.0, 102913.0, 94723.0, 80537.0, 64981.0, 49087.0, 35965.0, 24985.0, 16607.0, 10980.0, 6953.0, 4341.0, 2754.0, 1695.0, 1091.0, 649.0, 425.0, 222.0, 144.0, 100.0, 43.0, 28.0, 14.0, 8.0, 8.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.453125, -19.828857421875, -19.20458984375, -18.580322265625, -17.9560546875, -17.331787109375, -16.70751953125, -16.083251953125, -15.458984375, -14.834716796875, -14.21044921875, -13.586181640625, -12.9619140625, -12.337646484375, -11.71337890625, -11.089111328125, -10.46484375, -9.840576171875, -9.21630859375, -8.592041015625, -7.9677734375, -7.343505859375, -6.71923828125, -6.094970703125, -5.470703125, -4.846435546875, -4.22216796875, -3.597900390625, -2.9736328125, -2.349365234375, -1.72509765625, -1.100830078125, -0.4765625, 0.147705078125, 0.77197265625, 1.396240234375, 2.0205078125, 2.644775390625, 3.26904296875, 3.893310546875, 4.517578125, 5.141845703125, 5.76611328125, 6.390380859375, 7.0146484375, 7.638916015625, 8.26318359375, 8.887451171875, 9.51171875, 10.135986328125, 10.76025390625, 11.384521484375, 12.0087890625, 12.633056640625, 13.25732421875, 13.881591796875, 14.505859375, 15.130126953125, 15.75439453125, 16.378662109375, 17.0029296875, 17.627197265625, 18.25146484375, 18.875732421875, 19.5]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 7.0, 10.0, 12.0, 14.0, 10.0, 20.0, 23.0, 16.0, 21.0, 30.0, 29.0, 38.0, 36.0, 30.0, 32.0, 41.0, 59.0, 50.0, 62.0, 53.0, 44.0, 37.0, 38.0, 43.0, 51.0, 30.0, 30.0, 27.0, 11.0, 17.0, 15.0, 10.0, 6.0, 4.0, 8.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.0638427734375, -8.760498046875, -8.4571533203125, -8.15380859375, -7.8504638671875, -7.547119140625, -7.2437744140625, -6.9404296875, -6.6370849609375, -6.333740234375, -6.0303955078125, -5.72705078125, -5.4237060546875, -5.120361328125, -4.8170166015625, -4.513671875, -4.2103271484375, -3.906982421875, -3.6036376953125, -3.30029296875, -2.9969482421875, -2.693603515625, -2.3902587890625, -2.0869140625, -1.7835693359375, -1.480224609375, -1.1768798828125, -0.87353515625, -0.5701904296875, -0.266845703125, 0.0364990234375, 0.33984375, 0.6431884765625, 0.946533203125, 1.2498779296875, 1.55322265625, 1.8565673828125, 2.159912109375, 2.4632568359375, 2.7666015625, 3.0699462890625, 3.373291015625, 3.6766357421875, 3.97998046875, 4.2833251953125, 4.586669921875, 4.8900146484375, 5.193359375, 5.4967041015625, 5.800048828125, 6.1033935546875, 6.40673828125, 6.7100830078125, 7.013427734375, 7.3167724609375, 7.6201171875, 7.9234619140625, 8.226806640625, 8.5301513671875, 8.83349609375, 9.1368408203125, 9.440185546875, 9.7435302734375, 10.046875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 5.0, 8.0, 12.0, 5.0, 13.0, 9.0, 17.0, 15.0, 13.0, 15.0, 22.0, 22.0, 18.0, 36.0, 35.0, 32.0, 33.0, 43.0, 48.0, 41.0, 32.0, 40.0, 38.0, 40.0, 51.0, 34.0, 43.0, 29.0, 25.0, 24.0, 24.0, 25.0, 20.0, 17.0, 16.0, 11.0, 19.0, 7.0, 7.0, 10.0, 6.0, 7.0, 8.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.550498962402344, -51.78920364379883, -50.02790832519531, -48.26660919189453, -46.505313873291016, -44.7440185546875, -42.982723236083984, -41.22142791748047, -39.46012878417969, -37.69883346557617, -35.937538146972656, -34.176239013671875, -32.41494369506836, -30.653648376464844, -28.892353057861328, -27.13105583190918, -25.369760513305664, -23.60846519470215, -21.84716796875, -20.085872650146484, -18.324575424194336, -16.56328010559082, -14.801983833312988, -13.040687561035156, -11.279391288757324, -9.518095016479492, -7.75679874420166, -5.995502948760986, -4.234206676483154, -2.4729108810424805, -0.7116146087646484, 1.0496816635131836, 2.8109779357910156, 4.572274208068848, 6.33357048034668, 8.094865798950195, 9.856163024902344, 11.61745834350586, 13.378754615783691, 15.140050888061523, 16.901348114013672, 18.662643432617188, 20.423940658569336, 22.18523597717285, 23.946533203125, 25.707828521728516, 27.46912384033203, 29.23042106628418, 30.991716384887695, 32.753013610839844, 34.51430892944336, 36.275604248046875, 38.03689956665039, 39.798194885253906, 41.55949401855469, 43.3207893371582, 45.08208465576172, 46.843379974365234, 48.60467529296875, 50.36597442626953, 52.12726974487305, 53.88856506347656, 55.64986038208008, 57.411155700683594, 59.172454833984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 10.0, 7.0, 14.0, 16.0, 13.0, 17.0, 24.0, 16.0, 24.0, 25.0, 29.0, 26.0, 25.0, 29.0, 39.0, 33.0, 50.0, 42.0, 33.0, 35.0, 41.0, 56.0, 37.0, 36.0, 26.0, 34.0, 33.0, 17.0, 25.0, 31.0, 20.0, 24.0, 21.0, 20.0, 8.0, 11.0, 7.0, 6.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-64.747314453125, -62.61769104003906, -60.488067626953125, -58.35844421386719, -56.22882080078125, -54.09919738769531, -51.96957015991211, -49.83994674682617, -47.710323333740234, -45.5806999206543, -43.45107650756836, -41.32145309448242, -39.19182586669922, -37.06220245361328, -34.932579040527344, -32.802955627441406, -30.67333221435547, -28.54370880126953, -26.414085388183594, -24.284460067749023, -22.154836654663086, -20.02521324157715, -17.895587921142578, -15.76596450805664, -13.636341094970703, -11.506717681884766, -9.377093315124512, -7.247469425201416, -5.11784553527832, -2.988222122192383, -0.8585977554321289, 1.271026611328125, 3.4006423950195312, 5.530266284942627, 7.659890174865723, 9.789514541625977, 11.919137954711914, 14.048761367797852, 16.178386688232422, 18.30801010131836, 20.437633514404297, 22.567256927490234, 24.696880340576172, 26.826505661010742, 28.95612907409668, 31.085752487182617, 33.21537780761719, 35.345001220703125, 37.47462463378906, 39.604248046875, 41.73387145996094, 43.863494873046875, 45.99311828613281, 48.12274169921875, 50.25236892700195, 52.38199234008789, 54.51161575317383, 56.641239166259766, 58.7708625793457, 60.90048599243164, 63.030113220214844, 65.15973663330078, 67.28936004638672, 69.41898345947266, 71.5486068725586]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 11.0, 11.0, 26.0, 21.0, 47.0, 95.0, 179.0, 308.0, 493.0, 862.0, 1508.0, 2542.0, 4451.0, 7285.0, 11939.0, 19476.0, 31068.0, 48196.0, 73790.0, 108174.0, 153667.0, 208669.0, 270833.0, 331629.0, 381947.0, 410741.0, 413483.0, 386163.0, 340370.0, 279901.0, 217450.0, 161440.0, 113742.0, 77355.0, 51429.0, 32780.0, 20434.0, 12770.0, 7775.0, 4653.0, 2692.0, 1638.0, 961.0, 545.0, 299.0, 179.0, 128.0, 47.0, 35.0, 21.0, 12.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.53125, -42.08349609375, -40.6357421875, -39.18798828125, -37.740234375, -36.29248046875, -34.8447265625, -33.39697265625, -31.94921875, -30.50146484375, -29.0537109375, -27.60595703125, -26.158203125, -24.71044921875, -23.2626953125, -21.81494140625, -20.3671875, -18.91943359375, -17.4716796875, -16.02392578125, -14.576171875, -13.12841796875, -11.6806640625, -10.23291015625, -8.78515625, -7.33740234375, -5.8896484375, -4.44189453125, -2.994140625, -1.54638671875, -0.0986328125, 1.34912109375, 2.796875, 4.24462890625, 5.6923828125, 7.14013671875, 8.587890625, 10.03564453125, 11.4833984375, 12.93115234375, 14.37890625, 15.82666015625, 17.2744140625, 18.72216796875, 20.169921875, 21.61767578125, 23.0654296875, 24.51318359375, 25.9609375, 27.40869140625, 28.8564453125, 30.30419921875, 31.751953125, 33.19970703125, 34.6474609375, 36.09521484375, 37.54296875, 38.99072265625, 40.4384765625, 41.88623046875, 43.333984375, 44.78173828125, 46.2294921875, 47.67724609375, 49.125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 9.0, 6.0, 7.0, 16.0, 15.0, 17.0, 17.0, 22.0, 14.0, 25.0, 24.0, 28.0, 25.0, 25.0, 36.0, 36.0, 38.0, 43.0, 43.0, 29.0, 33.0, 46.0, 52.0, 45.0, 29.0, 25.0, 31.0, 32.0, 26.0, 24.0, 24.0, 24.0, 22.0, 24.0, 16.0, 14.0, 8.0, 7.0, 7.0, 6.0, 9.0, 2.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-58.53125, -56.60009765625, -54.6689453125, -52.73779296875, -50.806640625, -48.87548828125, -46.9443359375, -45.01318359375, -43.08203125, -41.15087890625, -39.2197265625, -37.28857421875, -35.357421875, -33.42626953125, -31.4951171875, -29.56396484375, -27.6328125, -25.70166015625, -23.7705078125, -21.83935546875, -19.908203125, -17.97705078125, -16.0458984375, -14.11474609375, -12.18359375, -10.25244140625, -8.3212890625, -6.39013671875, -4.458984375, -2.52783203125, -0.5966796875, 1.33447265625, 3.265625, 5.19677734375, 7.1279296875, 9.05908203125, 10.990234375, 12.92138671875, 14.8525390625, 16.78369140625, 18.71484375, 20.64599609375, 22.5771484375, 24.50830078125, 26.439453125, 28.37060546875, 30.3017578125, 32.23291015625, 34.1640625, 36.09521484375, 38.0263671875, 39.95751953125, 41.888671875, 43.81982421875, 45.7509765625, 47.68212890625, 49.61328125, 51.54443359375, 53.4755859375, 55.40673828125, 57.337890625, 59.26904296875, 61.2001953125, 63.13134765625, 65.0625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 11.0, 20.0, 41.0, 74.0, 143.0, 225.0, 396.0, 651.0, 1145.0, 1898.0, 3292.0, 5403.0, 8824.0, 13956.0, 22272.0, 34693.0, 51958.0, 76222.0, 107770.0, 147345.0, 193712.0, 245097.0, 294054.0, 336604.0, 365759.0, 376040.0, 364859.0, 336058.0, 293649.0, 244975.0, 193072.0, 147245.0, 106742.0, 75223.0, 51907.0, 34520.0, 22245.0, 14099.0, 8765.0, 5353.0, 3286.0, 1920.0, 1157.0, 656.0, 385.0, 230.0, 132.0, 84.0, 47.0, 32.0, 19.0, 14.0, 3.0, 1.0, 3.0], "bins": [-48.84375, -47.427734375, -46.01171875, -44.595703125, -43.1796875, -41.763671875, -40.34765625, -38.931640625, -37.515625, -36.099609375, -34.68359375, -33.267578125, -31.8515625, -30.435546875, -29.01953125, -27.603515625, -26.1875, -24.771484375, -23.35546875, -21.939453125, -20.5234375, -19.107421875, -17.69140625, -16.275390625, -14.859375, -13.443359375, -12.02734375, -10.611328125, -9.1953125, -7.779296875, -6.36328125, -4.947265625, -3.53125, -2.115234375, -0.69921875, 0.716796875, 2.1328125, 3.548828125, 4.96484375, 6.380859375, 7.796875, 9.212890625, 10.62890625, 12.044921875, 13.4609375, 14.876953125, 16.29296875, 17.708984375, 19.125, 20.541015625, 21.95703125, 23.373046875, 24.7890625, 26.205078125, 27.62109375, 29.037109375, 30.453125, 31.869140625, 33.28515625, 34.701171875, 36.1171875, 37.533203125, 38.94921875, 40.365234375, 41.78125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 3.0, 2.0, 5.0, 10.0, 5.0, 16.0, 9.0, 15.0, 17.0, 30.0, 29.0, 32.0, 39.0, 55.0, 64.0, 80.0, 84.0, 119.0, 117.0, 126.0, 130.0, 157.0, 158.0, 178.0, 170.0, 199.0, 200.0, 178.0, 153.0, 178.0, 159.0, 184.0, 145.0, 153.0, 114.0, 130.0, 98.0, 73.0, 69.0, 76.0, 65.0, 43.0, 42.0, 32.0, 29.0, 34.0, 24.0, 21.0, 9.0, 4.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.96875, -24.1494140625, -23.330078125, -22.5107421875, -21.69140625, -20.8720703125, -20.052734375, -19.2333984375, -18.4140625, -17.5947265625, -16.775390625, -15.9560546875, -15.13671875, -14.3173828125, -13.498046875, -12.6787109375, -11.859375, -11.0400390625, -10.220703125, -9.4013671875, -8.58203125, -7.7626953125, -6.943359375, -6.1240234375, -5.3046875, -4.4853515625, -3.666015625, -2.8466796875, -2.02734375, -1.2080078125, -0.388671875, 0.4306640625, 1.25, 2.0693359375, 2.888671875, 3.7080078125, 4.52734375, 5.3466796875, 6.166015625, 6.9853515625, 7.8046875, 8.6240234375, 9.443359375, 10.2626953125, 11.08203125, 11.9013671875, 12.720703125, 13.5400390625, 14.359375, 15.1787109375, 15.998046875, 16.8173828125, 17.63671875, 18.4560546875, 19.275390625, 20.0947265625, 20.9140625, 21.7333984375, 22.552734375, 23.3720703125, 24.19140625, 25.0107421875, 25.830078125, 26.6494140625, 27.46875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 11.0, 9.0, 11.0, 18.0, 18.0, 20.0, 16.0, 21.0, 20.0, 28.0, 27.0, 36.0, 38.0, 41.0, 44.0, 54.0, 63.0, 44.0, 42.0, 44.0, 58.0, 33.0, 40.0, 28.0, 27.0, 31.0, 30.0, 22.0, 19.0, 22.0, 14.0, 9.0, 8.0, 7.0, 6.0, 8.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-78.44146728515625, -76.33866882324219, -74.23587036132812, -72.1330795288086, -70.03028106689453, -67.92748260498047, -65.8246841430664, -63.721885681152344, -61.61909103393555, -59.516292572021484, -57.41349792480469, -55.310699462890625, -53.20790100097656, -51.105106353759766, -49.0023078918457, -46.899513244628906, -44.796714782714844, -42.69391632080078, -40.591121673583984, -38.48832321166992, -36.385528564453125, -34.28273010253906, -32.179931640625, -30.07713508605957, -27.97433853149414, -25.87154197692871, -23.76874542236328, -21.66594696044922, -19.56315040588379, -17.46035385131836, -15.357556343078613, -13.254758834838867, -11.151966094970703, -9.049169540405273, -6.946372032165527, -4.8435750007629395, -2.7407779693603516, -0.6379814147949219, 1.4648160934448242, 3.5676136016845703, 5.67041015625, 7.773207187652588, 9.876004219055176, 11.978801727294922, 14.081598281860352, 16.18439483642578, 18.287193298339844, 20.389989852905273, 22.492786407470703, 24.595582962036133, 26.698379516601562, 28.801177978515625, 30.903974533081055, 33.006771087646484, 35.10956954956055, 37.212364196777344, 39.315162658691406, 41.41796112060547, 43.520755767822266, 45.62355422973633, 47.726348876953125, 49.82914733886719, 51.93194580078125, 54.03474426269531, 56.13753890991211]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 10.0, 8.0, 7.0, 5.0, 13.0, 17.0, 19.0, 16.0, 23.0, 20.0, 32.0, 30.0, 25.0, 41.0, 32.0, 23.0, 48.0, 42.0, 43.0, 44.0, 44.0, 43.0, 47.0, 52.0, 44.0, 34.0, 20.0, 28.0, 40.0, 25.0, 22.0, 19.0, 18.0, 13.0, 13.0, 3.0, 17.0, 4.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.32952117919922, -70.92608642578125, -68.52265167236328, -66.11920928955078, -63.71577453613281, -61.312339782714844, -58.908905029296875, -56.505470275878906, -54.10203170776367, -51.6985969543457, -49.29515838623047, -46.8917236328125, -44.48828887939453, -42.0848503112793, -39.68141555786133, -37.277976989746094, -34.874542236328125, -32.471107482910156, -30.067668914794922, -27.664234161376953, -25.26079750061035, -22.85736083984375, -20.45392608642578, -18.05048942565918, -15.647052764892578, -13.243616104125977, -10.840180397033691, -8.436744689941406, -6.033308029174805, -3.629871368408203, -1.226435661315918, 1.1770000457763672, 3.5804367065429688, 5.983872890472412, 8.387309074401855, 10.79074478149414, 13.194181442260742, 15.597618103027344, 18.001052856445312, 20.404489517211914, 22.807926177978516, 25.211362838745117, 27.61479949951172, 30.018234252929688, 32.421669006347656, 34.82510757446289, 37.22854232788086, 39.631980895996094, 42.03541564941406, 44.43885040283203, 46.842288970947266, 49.245723724365234, 51.64916229248047, 54.05259704589844, 56.456031799316406, 58.859466552734375, 61.26290512084961, 63.66633987426758, 66.06977844238281, 68.47321319580078, 70.87664794921875, 73.28009033203125, 75.68352508544922, 78.08695983886719, 80.49039459228516]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 14.0, 9.0, 36.0, 39.0, 70.0, 94.0, 150.0, 238.0, 393.0, 568.0, 933.0, 1389.0, 2162.0, 3399.0, 5161.0, 7729.0, 11879.0, 17476.0, 25554.0, 36840.0, 50749.0, 66423.0, 84545.0, 99853.0, 108293.0, 108470.0, 99757.0, 85001.0, 66995.0, 50568.0, 36464.0, 25627.0, 17374.0, 11874.0, 7808.0, 4899.0, 3364.0, 2227.0, 1462.0, 918.0, 592.0, 364.0, 254.0, 183.0, 114.0, 83.0, 51.0, 32.0, 19.0, 20.0, 12.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-8.390625, -8.12841796875, -7.8662109375, -7.60400390625, -7.341796875, -7.07958984375, -6.8173828125, -6.55517578125, -6.29296875, -6.03076171875, -5.7685546875, -5.50634765625, -5.244140625, -4.98193359375, -4.7197265625, -4.45751953125, -4.1953125, -3.93310546875, -3.6708984375, -3.40869140625, -3.146484375, -2.88427734375, -2.6220703125, -2.35986328125, -2.09765625, -1.83544921875, -1.5732421875, -1.31103515625, -1.048828125, -0.78662109375, -0.5244140625, -0.26220703125, 0.0, 0.26220703125, 0.5244140625, 0.78662109375, 1.048828125, 1.31103515625, 1.5732421875, 1.83544921875, 2.09765625, 2.35986328125, 2.6220703125, 2.88427734375, 3.146484375, 3.40869140625, 3.6708984375, 3.93310546875, 4.1953125, 4.45751953125, 4.7197265625, 4.98193359375, 5.244140625, 5.50634765625, 5.7685546875, 6.03076171875, 6.29296875, 6.55517578125, 6.8173828125, 7.07958984375, 7.341796875, 7.60400390625, 7.8662109375, 8.12841796875, 8.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 8.0, 8.0, 4.0, 13.0, 19.0, 16.0, 17.0, 22.0, 22.0, 30.0, 30.0, 26.0, 41.0, 32.0, 24.0, 48.0, 40.0, 44.0, 46.0, 43.0, 43.0, 47.0, 49.0, 44.0, 35.0, 22.0, 28.0, 37.0, 28.0, 22.0, 19.0, 18.0, 12.0, 13.0, 5.0, 15.0, 4.0, 3.0, 3.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.8125, -71.40234375, -68.9921875, -66.58203125, -64.171875, -61.76171875, -59.3515625, -56.94140625, -54.53125, -52.12109375, -49.7109375, -47.30078125, -44.890625, -42.48046875, -40.0703125, -37.66015625, -35.25, -32.83984375, -30.4296875, -28.01953125, -25.609375, -23.19921875, -20.7890625, -18.37890625, -15.96875, -13.55859375, -11.1484375, -8.73828125, -6.328125, -3.91796875, -1.5078125, 0.90234375, 3.3125, 5.72265625, 8.1328125, 10.54296875, 12.953125, 15.36328125, 17.7734375, 20.18359375, 22.59375, 25.00390625, 27.4140625, 29.82421875, 32.234375, 34.64453125, 37.0546875, 39.46484375, 41.875, 44.28515625, 46.6953125, 49.10546875, 51.515625, 53.92578125, 56.3359375, 58.74609375, 61.15625, 63.56640625, 65.9765625, 68.38671875, 70.796875, 73.20703125, 75.6171875, 78.02734375, 80.4375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 6.0, 10.0, 5.0, 13.0, 17.0, 26.0, 37.0, 57.0, 82.0, 107.0, 171.0, 242.0, 349.0, 471.0, 650.0, 914.0, 1176.0, 1710.0, 2388.0, 3183.0, 4382.0, 6026.0, 8449.0, 11836.0, 17691.0, 30591.0, 203153.0, 623330.0, 58073.0, 22302.0, 14720.0, 10020.0, 7175.0, 5236.0, 3814.0, 2829.0, 2006.0, 1484.0, 1107.0, 779.0, 495.0, 429.0, 315.0, 218.0, 133.0, 95.0, 83.0, 48.0, 45.0, 25.0, 14.0, 17.0, 9.0, 10.0, 1.0, 3.0, 3.0, 3.0], "bins": [-16.109375, -15.625, -15.140625, -14.65625, -14.171875, -13.6875, -13.203125, -12.71875, -12.234375, -11.75, -11.265625, -10.78125, -10.296875, -9.8125, -9.328125, -8.84375, -8.359375, -7.875, -7.390625, -6.90625, -6.421875, -5.9375, -5.453125, -4.96875, -4.484375, -4.0, -3.515625, -3.03125, -2.546875, -2.0625, -1.578125, -1.09375, -0.609375, -0.125, 0.359375, 0.84375, 1.328125, 1.8125, 2.296875, 2.78125, 3.265625, 3.75, 4.234375, 4.71875, 5.203125, 5.6875, 6.171875, 6.65625, 7.140625, 7.625, 8.109375, 8.59375, 9.078125, 9.5625, 10.046875, 10.53125, 11.015625, 11.5, 11.984375, 12.46875, 12.953125, 13.4375, 13.921875, 14.40625, 14.890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 12.0, 14.0, 14.0, 19.0, 22.0, 23.0, 20.0, 28.0, 26.0, 32.0, 28.0, 34.0, 43.0, 50.0, 58.0, 47.0, 44.0, 39.0, 52.0, 42.0, 37.0, 45.0, 47.0, 25.0, 29.0, 25.0, 21.0, 18.0, 26.0, 12.0, 16.0, 13.0, 14.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.59375, -49.8564453125, -48.119140625, -46.3818359375, -44.64453125, -42.9072265625, -41.169921875, -39.4326171875, -37.6953125, -35.9580078125, -34.220703125, -32.4833984375, -30.74609375, -29.0087890625, -27.271484375, -25.5341796875, -23.796875, -22.0595703125, -20.322265625, -18.5849609375, -16.84765625, -15.1103515625, -13.373046875, -11.6357421875, -9.8984375, -8.1611328125, -6.423828125, -4.6865234375, -2.94921875, -1.2119140625, 0.525390625, 2.2626953125, 4.0, 5.7373046875, 7.474609375, 9.2119140625, 10.94921875, 12.6865234375, 14.423828125, 16.1611328125, 17.8984375, 19.6357421875, 21.373046875, 23.1103515625, 24.84765625, 26.5849609375, 28.322265625, 30.0595703125, 31.796875, 33.5341796875, 35.271484375, 37.0087890625, 38.74609375, 40.4833984375, 42.220703125, 43.9580078125, 45.6953125, 47.4326171875, 49.169921875, 50.9072265625, 52.64453125, 54.3818359375, 56.119140625, 57.8564453125, 59.59375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 11.0, 11.0, 14.0, 17.0, 31.0, 41.0, 47.0, 78.0, 112.0, 135.0, 235.0, 279.0, 433.0, 627.0, 940.0, 1388.0, 2029.0, 3041.0, 4434.0, 6742.0, 10233.0, 15530.0, 24688.0, 81162.0, 790983.0, 42207.0, 21684.0, 13920.0, 9153.0, 6018.0, 4014.0, 2647.0, 1783.0, 1221.0, 825.0, 529.0, 402.0, 268.0, 166.0, 138.0, 102.0, 57.0, 56.0, 33.0, 33.0, 11.0, 8.0, 11.0, 7.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.140625, -2.074493408203125, -2.00836181640625, -1.942230224609375, -1.8760986328125, -1.809967041015625, -1.74383544921875, -1.677703857421875, -1.611572265625, -1.545440673828125, -1.47930908203125, -1.413177490234375, -1.3470458984375, -1.280914306640625, -1.21478271484375, -1.148651123046875, -1.08251953125, -1.016387939453125, -0.95025634765625, -0.884124755859375, -0.8179931640625, -0.751861572265625, -0.68572998046875, -0.619598388671875, -0.553466796875, -0.487335205078125, -0.42120361328125, -0.355072021484375, -0.2889404296875, -0.222808837890625, -0.15667724609375, -0.090545654296875, -0.0244140625, 0.041717529296875, 0.10784912109375, 0.173980712890625, 0.2401123046875, 0.306243896484375, 0.37237548828125, 0.438507080078125, 0.504638671875, 0.570770263671875, 0.63690185546875, 0.703033447265625, 0.7691650390625, 0.835296630859375, 0.90142822265625, 0.967559814453125, 1.03369140625, 1.099822998046875, 1.16595458984375, 1.232086181640625, 1.2982177734375, 1.364349365234375, 1.43048095703125, 1.496612548828125, 1.562744140625, 1.628875732421875, 1.69500732421875, 1.761138916015625, 1.8272705078125, 1.893402099609375, 1.95953369140625, 2.025665283203125, 2.091796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 4.0, 10.0, 19.0, 14.0, 20.0, 14.0, 21.0, 28.0, 17.0, 35.0, 31.0, 38.0, 33.0, 51.0, 56.0, 35.0, 40.0, 49.0, 41.0, 54.0, 46.0, 36.0, 35.0, 39.0, 40.0, 31.0, 22.0, 21.0, 17.0, 16.0, 17.0, 10.0, 11.0, 3.0, 9.0, 1.0, 8.0, 4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 1.0], "bins": [-7.224082946777344e-05, -7.024593651294708e-05, -6.825104355812073e-05, -6.625615060329437e-05, -6.426125764846802e-05, -6.226636469364166e-05, -6.027147173881531e-05, -5.827657878398895e-05, -5.62816858291626e-05, -5.428679287433624e-05, -5.229189991950989e-05, -5.029700696468353e-05, -4.830211400985718e-05, -4.630722105503082e-05, -4.431232810020447e-05, -4.231743514537811e-05, -4.032254219055176e-05, -3.83276492357254e-05, -3.633275628089905e-05, -3.433786332607269e-05, -3.234297037124634e-05, -3.0348077416419983e-05, -2.8353184461593628e-05, -2.6358291506767273e-05, -2.4363398551940918e-05, -2.2368505597114563e-05, -2.0373612642288208e-05, -1.8378719687461853e-05, -1.6383826732635498e-05, -1.4388933777809143e-05, -1.2394040822982788e-05, -1.0399147868156433e-05, -8.404254913330078e-06, -6.409361958503723e-06, -4.414469003677368e-06, -2.419576048851013e-06, -4.246830940246582e-07, 1.5702098608016968e-06, 3.5651028156280518e-06, 5.559995770454407e-06, 7.554888725280762e-06, 9.549781680107117e-06, 1.1544674634933472e-05, 1.3539567589759827e-05, 1.553446054458618e-05, 1.7529353499412537e-05, 1.952424645423889e-05, 2.1519139409065247e-05, 2.35140323638916e-05, 2.5508925318717957e-05, 2.750381827354431e-05, 2.9498711228370667e-05, 3.149360418319702e-05, 3.3488497138023376e-05, 3.548339009284973e-05, 3.7478283047676086e-05, 3.947317600250244e-05, 4.1468068957328796e-05, 4.346296191215515e-05, 4.5457854866981506e-05, 4.745274782180786e-05, 4.9447640776634216e-05, 5.144253373146057e-05, 5.3437426686286926e-05, 5.543231964111328e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 11.0, 12.0, 18.0, 48.0, 45.0, 83.0, 118.0, 161.0, 238.0, 373.0, 526.0, 755.0, 1140.0, 1624.0, 2391.0, 3278.0, 4897.0, 6848.0, 9652.0, 14233.0, 19534.0, 27555.0, 38876.0, 52906.0, 70803.0, 91497.0, 110773.0, 119125.0, 112220.0, 93968.0, 73139.0, 54603.0, 40099.0, 28479.0, 20639.0, 14438.0, 10174.0, 7190.0, 4893.0, 3426.0, 2365.0, 1687.0, 1142.0, 809.0, 569.0, 411.0, 257.0, 198.0, 117.0, 91.0, 45.0, 40.0, 13.0, 19.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.6806640625, -1.6256561279296875, -1.570648193359375, -1.5156402587890625, -1.46063232421875, -1.4056243896484375, -1.350616455078125, -1.2956085205078125, -1.2406005859375, -1.1855926513671875, -1.130584716796875, -1.0755767822265625, -1.02056884765625, -0.9655609130859375, -0.910552978515625, -0.8555450439453125, -0.800537109375, -0.7455291748046875, -0.690521240234375, -0.6355133056640625, -0.58050537109375, -0.5254974365234375, -0.470489501953125, -0.4154815673828125, -0.3604736328125, -0.3054656982421875, -0.250457763671875, -0.1954498291015625, -0.14044189453125, -0.0854339599609375, -0.030426025390625, 0.0245819091796875, 0.07958984375, 0.1345977783203125, 0.189605712890625, 0.2446136474609375, 0.29962158203125, 0.3546295166015625, 0.409637451171875, 0.4646453857421875, 0.5196533203125, 0.5746612548828125, 0.629669189453125, 0.6846771240234375, 0.73968505859375, 0.7946929931640625, 0.849700927734375, 0.9047088623046875, 0.959716796875, 1.0147247314453125, 1.069732666015625, 1.1247406005859375, 1.17974853515625, 1.2347564697265625, 1.289764404296875, 1.3447723388671875, 1.3997802734375, 1.4547882080078125, 1.509796142578125, 1.5648040771484375, 1.61981201171875, 1.6748199462890625, 1.729827880859375, 1.7848358154296875, 1.83984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 6.0, 10.0, 3.0, 12.0, 16.0, 10.0, 23.0, 30.0, 27.0, 40.0, 55.0, 32.0, 48.0, 60.0, 89.0, 89.0, 72.0, 46.0, 45.0, 38.0, 40.0, 33.0, 30.0, 24.0, 30.0, 18.0, 11.0, 9.0, 13.0, 5.0, 2.0, 4.0, 5.0, 1.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.1164093017578125, -1.073638916015625, -1.0308685302734375, -0.98809814453125, -0.9453277587890625, -0.902557373046875, -0.8597869873046875, -0.8170166015625, -0.7742462158203125, -0.731475830078125, -0.6887054443359375, -0.64593505859375, -0.6031646728515625, -0.560394287109375, -0.5176239013671875, -0.474853515625, -0.4320831298828125, -0.389312744140625, -0.3465423583984375, -0.30377197265625, -0.2610015869140625, -0.218231201171875, -0.1754608154296875, -0.1326904296875, -0.0899200439453125, -0.047149658203125, -0.0043792724609375, 0.03839111328125, 0.0811614990234375, 0.123931884765625, 0.1667022705078125, 0.20947265625, 0.2522430419921875, 0.295013427734375, 0.3377838134765625, 0.38055419921875, 0.4233245849609375, 0.466094970703125, 0.5088653564453125, 0.5516357421875, 0.5944061279296875, 0.637176513671875, 0.6799468994140625, 0.72271728515625, 0.7654876708984375, 0.808258056640625, 0.8510284423828125, 0.893798828125, 0.9365692138671875, 0.979339599609375, 1.0221099853515625, 1.06488037109375, 1.1076507568359375, 1.150421142578125, 1.1931915283203125, 1.2359619140625, 1.2787322998046875, 1.321502685546875, 1.3642730712890625, 1.40704345703125, 1.4498138427734375, 1.492584228515625, 1.5353546142578125, 1.578125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 12.0, 11.0, 23.0, 17.0, 17.0, 21.0, 19.0, 24.0, 21.0, 34.0, 39.0, 36.0, 43.0, 46.0, 56.0, 55.0, 49.0, 38.0, 50.0, 51.0, 37.0, 37.0, 30.0, 35.0, 25.0, 23.0, 25.0, 22.0, 14.0, 12.0, 11.0, 10.0, 3.0, 6.0, 11.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-79.88013458251953, -77.76766967773438, -75.65519714355469, -73.54273223876953, -71.43026733398438, -69.31780242919922, -67.20533752441406, -65.09286499023438, -62.98040008544922, -60.86793518066406, -58.75546646118164, -56.64299774169922, -54.53053283691406, -52.418067932128906, -50.305599212646484, -48.19313049316406, -46.080665588378906, -43.96820068359375, -41.85573196411133, -39.743263244628906, -37.63079833984375, -35.518333435058594, -33.40586471557617, -31.293397903442383, -29.180931091308594, -27.068464279174805, -24.955997467041016, -22.843530654907227, -20.731063842773438, -18.61859703063965, -16.50613021850586, -14.39366340637207, -12.281192779541016, -10.168725967407227, -8.056259155273438, -5.943792343139648, -3.8313255310058594, -1.7188587188720703, 0.39360809326171875, 2.506074905395508, 4.618541717529297, 6.731008529663086, 8.843475341796875, 10.955942153930664, 13.068408966064453, 15.180875778198242, 17.29334259033203, 19.40580940246582, 21.51827621459961, 23.6307430267334, 25.743209838867188, 27.855676651000977, 29.968143463134766, 32.08061218261719, 34.193077087402344, 36.3055419921875, 38.41801071166992, 40.530479431152344, 42.6429443359375, 44.755409240722656, 46.86787796020508, 48.9803466796875, 51.092811584472656, 53.20527648925781, 55.317745208740234]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 12.0, 7.0, 5.0, 6.0, 12.0, 20.0, 16.0, 16.0, 27.0, 20.0, 36.0, 25.0, 24.0, 42.0, 29.0, 27.0, 45.0, 46.0, 40.0, 49.0, 40.0, 42.0, 48.0, 54.0, 42.0, 32.0, 24.0, 26.0, 37.0, 27.0, 22.0, 17.0, 21.0, 12.0, 11.0, 5.0, 15.0, 4.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.3089828491211, -70.90727996826172, -68.50557708740234, -66.10387420654297, -63.70217514038086, -61.300472259521484, -58.89876937866211, -56.4970703125, -54.095367431640625, -51.69366455078125, -49.291961669921875, -46.8902587890625, -44.48855972290039, -42.086856842041016, -39.68515396118164, -37.28345489501953, -34.88174819946289, -32.480045318603516, -30.078344345092773, -27.6766414642334, -25.274940490722656, -22.87323760986328, -20.471534729003906, -18.069833755493164, -15.668130874633789, -13.26642894744873, -10.864727020263672, -8.463024139404297, -6.061322212219238, -3.6596202850341797, -1.2579174041748047, 1.1437835693359375, 3.5454864501953125, 5.947188377380371, 8.34889030456543, 10.750593185424805, 13.152295112609863, 15.553997039794922, 17.955699920654297, 20.35740089416504, 22.759103775024414, 25.16080665588379, 27.56250762939453, 29.964210510253906, 32.36591339111328, 34.767616271972656, 37.16931915283203, 39.57101821899414, 41.972721099853516, 44.37442398071289, 46.776126861572266, 49.177825927734375, 51.57952880859375, 53.981231689453125, 56.3829345703125, 58.784637451171875, 61.18634033203125, 63.588043212890625, 65.98974609375, 68.39144897460938, 70.79315185546875, 73.19485473632812, 75.5965576171875, 77.99825286865234, 80.39995574951172]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 9.0, 11.0, 9.0, 24.0, 55.0, 68.0, 115.0, 183.0, 337.0, 571.0, 952.0, 1479.0, 2392.0, 3854.0, 5967.0, 9128.0, 13696.0, 19649.0, 27743.0, 37418.0, 48445.0, 60860.0, 72988.0, 82096.0, 89519.0, 92336.0, 89942.0, 82454.0, 72746.0, 61235.0, 48627.0, 37195.0, 27898.0, 19510.0, 13666.0, 9235.0, 5798.0, 3930.0, 2392.0, 1568.0, 965.0, 625.0, 345.0, 220.0, 127.0, 67.0, 52.0, 26.0, 14.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-38.71875, -37.48974609375, -36.2607421875, -35.03173828125, -33.802734375, -32.57373046875, -31.3447265625, -30.11572265625, -28.88671875, -27.65771484375, -26.4287109375, -25.19970703125, -23.970703125, -22.74169921875, -21.5126953125, -20.28369140625, -19.0546875, -17.82568359375, -16.5966796875, -15.36767578125, -14.138671875, -12.90966796875, -11.6806640625, -10.45166015625, -9.22265625, -7.99365234375, -6.7646484375, -5.53564453125, -4.306640625, -3.07763671875, -1.8486328125, -0.61962890625, 0.609375, 1.83837890625, 3.0673828125, 4.29638671875, 5.525390625, 6.75439453125, 7.9833984375, 9.21240234375, 10.44140625, 11.67041015625, 12.8994140625, 14.12841796875, 15.357421875, 16.58642578125, 17.8154296875, 19.04443359375, 20.2734375, 21.50244140625, 22.7314453125, 23.96044921875, 25.189453125, 26.41845703125, 27.6474609375, 28.87646484375, 30.10546875, 31.33447265625, 32.5634765625, 33.79248046875, 35.021484375, 36.25048828125, 37.4794921875, 38.70849609375, 39.9375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 7.0, 6.0, 9.0, 9.0, 18.0, 19.0, 18.0, 23.0, 21.0, 33.0, 25.0, 27.0, 40.0, 31.0, 28.0, 43.0, 45.0, 39.0, 52.0, 40.0, 46.0, 45.0, 53.0, 45.0, 29.0, 23.0, 26.0, 36.0, 30.0, 21.0, 19.0, 18.0, 12.0, 11.0, 6.0, 14.0, 5.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.1875, -68.8564453125, -66.525390625, -64.1943359375, -61.86328125, -59.5322265625, -57.201171875, -54.8701171875, -52.5390625, -50.2080078125, -47.876953125, -45.5458984375, -43.21484375, -40.8837890625, -38.552734375, -36.2216796875, -33.890625, -31.5595703125, -29.228515625, -26.8974609375, -24.56640625, -22.2353515625, -19.904296875, -17.5732421875, -15.2421875, -12.9111328125, -10.580078125, -8.2490234375, -5.91796875, -3.5869140625, -1.255859375, 1.0751953125, 3.40625, 5.7373046875, 8.068359375, 10.3994140625, 12.73046875, 15.0615234375, 17.392578125, 19.7236328125, 22.0546875, 24.3857421875, 26.716796875, 29.0478515625, 31.37890625, 33.7099609375, 36.041015625, 38.3720703125, 40.703125, 43.0341796875, 45.365234375, 47.6962890625, 50.02734375, 52.3583984375, 54.689453125, 57.0205078125, 59.3515625, 61.6826171875, 64.013671875, 66.3447265625, 68.67578125, 71.0068359375, 73.337890625, 75.6689453125, 78.0]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 14.0, 15.0, 41.0, 67.0, 91.0, 154.0, 276.0, 423.0, 748.0, 1147.0, 1781.0, 2779.0, 4241.0, 6414.0, 9390.0, 13677.0, 19098.0, 26237.0, 34481.0, 44099.0, 54667.0, 64576.0, 73652.0, 80603.0, 83704.0, 84224.0, 81180.0, 74144.0, 65097.0, 54839.0, 44215.0, 35244.0, 26326.0, 19321.0, 13565.0, 9597.0, 6449.0, 4356.0, 2801.0, 1846.0, 1186.0, 718.0, 436.0, 261.0, 160.0, 88.0, 62.0, 26.0, 27.0, 11.0, 2.0, 7.0, 0.0, 2.0, 1.0], "bins": [-37.96875, -36.8525390625, -35.736328125, -34.6201171875, -33.50390625, -32.3876953125, -31.271484375, -30.1552734375, -29.0390625, -27.9228515625, -26.806640625, -25.6904296875, -24.57421875, -23.4580078125, -22.341796875, -21.2255859375, -20.109375, -18.9931640625, -17.876953125, -16.7607421875, -15.64453125, -14.5283203125, -13.412109375, -12.2958984375, -11.1796875, -10.0634765625, -8.947265625, -7.8310546875, -6.71484375, -5.5986328125, -4.482421875, -3.3662109375, -2.25, -1.1337890625, -0.017578125, 1.0986328125, 2.21484375, 3.3310546875, 4.447265625, 5.5634765625, 6.6796875, 7.7958984375, 8.912109375, 10.0283203125, 11.14453125, 12.2607421875, 13.376953125, 14.4931640625, 15.609375, 16.7255859375, 17.841796875, 18.9580078125, 20.07421875, 21.1904296875, 22.306640625, 23.4228515625, 24.5390625, 25.6552734375, 26.771484375, 27.8876953125, 29.00390625, 30.1201171875, 31.236328125, 32.3525390625, 33.46875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 16.0, 9.0, 8.0, 22.0, 16.0, 17.0, 29.0, 27.0, 28.0, 26.0, 29.0, 31.0, 37.0, 57.0, 41.0, 42.0, 47.0, 50.0, 44.0, 39.0, 53.0, 34.0, 37.0, 31.0, 37.0, 21.0, 33.0, 23.0, 22.0, 13.0, 18.0, 17.0, 7.0, 11.0, 6.0, 7.0, 2.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5, -50.814453125, -49.12890625, -47.443359375, -45.7578125, -44.072265625, -42.38671875, -40.701171875, -39.015625, -37.330078125, -35.64453125, -33.958984375, -32.2734375, -30.587890625, -28.90234375, -27.216796875, -25.53125, -23.845703125, -22.16015625, -20.474609375, -18.7890625, -17.103515625, -15.41796875, -13.732421875, -12.046875, -10.361328125, -8.67578125, -6.990234375, -5.3046875, -3.619140625, -1.93359375, -0.248046875, 1.4375, 3.123046875, 4.80859375, 6.494140625, 8.1796875, 9.865234375, 11.55078125, 13.236328125, 14.921875, 16.607421875, 18.29296875, 19.978515625, 21.6640625, 23.349609375, 25.03515625, 26.720703125, 28.40625, 30.091796875, 31.77734375, 33.462890625, 35.1484375, 36.833984375, 38.51953125, 40.205078125, 41.890625, 43.576171875, 45.26171875, 46.947265625, 48.6328125, 50.318359375, 52.00390625, 53.689453125, 55.375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 6.0, 11.0, 14.0, 23.0, 51.0, 56.0, 82.0, 123.0, 188.0, 318.0, 449.0, 643.0, 969.0, 1493.0, 2151.0, 3158.0, 4590.0, 6668.0, 9513.0, 13259.0, 18157.0, 24046.0, 32623.0, 41651.0, 51072.0, 61334.0, 70438.0, 77668.0, 82003.0, 82957.0, 80404.0, 74972.0, 66021.0, 56546.0, 46274.0, 36882.0, 28336.0, 21183.0, 15552.0, 11294.0, 8034.0, 5517.0, 3831.0, 2558.0, 1781.0, 1224.0, 792.0, 535.0, 379.0, 249.0, 160.0, 132.0, 70.0, 45.0, 33.0, 19.0, 12.0, 9.0, 3.0, 0.0, 4.0], "bins": [-16.6875, -16.170166015625, -15.65283203125, -15.135498046875, -14.6181640625, -14.100830078125, -13.58349609375, -13.066162109375, -12.548828125, -12.031494140625, -11.51416015625, -10.996826171875, -10.4794921875, -9.962158203125, -9.44482421875, -8.927490234375, -8.41015625, -7.892822265625, -7.37548828125, -6.858154296875, -6.3408203125, -5.823486328125, -5.30615234375, -4.788818359375, -4.271484375, -3.754150390625, -3.23681640625, -2.719482421875, -2.2021484375, -1.684814453125, -1.16748046875, -0.650146484375, -0.1328125, 0.384521484375, 0.90185546875, 1.419189453125, 1.9365234375, 2.453857421875, 2.97119140625, 3.488525390625, 4.005859375, 4.523193359375, 5.04052734375, 5.557861328125, 6.0751953125, 6.592529296875, 7.10986328125, 7.627197265625, 8.14453125, 8.661865234375, 9.17919921875, 9.696533203125, 10.2138671875, 10.731201171875, 11.24853515625, 11.765869140625, 12.283203125, 12.800537109375, 13.31787109375, 13.835205078125, 14.3525390625, 14.869873046875, 15.38720703125, 15.904541015625, 16.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 5.0, 14.0, 18.0, 7.0, 9.0, 27.0, 28.0, 31.0, 36.0, 23.0, 63.0, 46.0, 37.0, 46.0, 62.0, 39.0, 51.0, 61.0, 53.0, 42.0, 35.0, 44.0, 32.0, 29.0, 30.0, 21.0, 29.0, 12.0, 11.0, 5.0, 6.0, 9.0, 12.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0032806396484375, -0.0031862258911132812, -0.0030918121337890625, -0.0029973983764648438, -0.002902984619140625, -0.0028085708618164062, -0.0027141571044921875, -0.0026197433471679688, -0.00252532958984375, -0.0024309158325195312, -0.0023365020751953125, -0.0022420883178710938, -0.002147674560546875, -0.0020532608032226562, -0.0019588470458984375, -0.0018644332885742188, -0.00177001953125, -0.0016756057739257812, -0.0015811920166015625, -0.0014867782592773438, -0.001392364501953125, -0.0012979507446289062, -0.0012035369873046875, -0.0011091232299804688, -0.00101470947265625, -0.0009202957153320312, -0.0008258819580078125, -0.0007314682006835938, -0.000637054443359375, -0.0005426406860351562, -0.0004482269287109375, -0.00035381317138671875, -0.0002593994140625, -0.00016498565673828125, -7.05718994140625e-05, 2.384185791015625e-05, 0.000118255615234375, 0.00021266937255859375, 0.0003070831298828125, 0.00040149688720703125, 0.00049591064453125, 0.0005903244018554688, 0.0006847381591796875, 0.0007791519165039062, 0.000873565673828125, 0.0009679794311523438, 0.0010623931884765625, 0.0011568069458007812, 0.001251220703125, 0.0013456344604492188, 0.0014400482177734375, 0.0015344619750976562, 0.001628875732421875, 0.0017232894897460938, 0.0018177032470703125, 0.0019121170043945312, 0.00200653076171875, 0.0021009445190429688, 0.0021953582763671875, 0.0022897720336914062, 0.002384185791015625, 0.0024785995483398438, 0.0025730133056640625, 0.0026674270629882812, 0.0027618408203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 7.0, 9.0, 15.0, 24.0, 31.0, 69.0, 94.0, 128.0, 206.0, 340.0, 541.0, 822.0, 1354.0, 2088.0, 3173.0, 4704.0, 7286.0, 10506.0, 15118.0, 21263.0, 29241.0, 38493.0, 49037.0, 60918.0, 72173.0, 81428.0, 86658.0, 88751.0, 86516.0, 79628.0, 70329.0, 59557.0, 47971.0, 37241.0, 27825.0, 20717.0, 14372.0, 10041.0, 6753.0, 4586.0, 2971.0, 2043.0, 1285.0, 830.0, 500.0, 338.0, 230.0, 140.0, 81.0, 54.0, 29.0, 17.0, 17.0, 5.0, 6.0, 1.0, 6.0, 1.0, 3.0], "bins": [-19.6875, -19.08056640625, -18.4736328125, -17.86669921875, -17.259765625, -16.65283203125, -16.0458984375, -15.43896484375, -14.83203125, -14.22509765625, -13.6181640625, -13.01123046875, -12.404296875, -11.79736328125, -11.1904296875, -10.58349609375, -9.9765625, -9.36962890625, -8.7626953125, -8.15576171875, -7.548828125, -6.94189453125, -6.3349609375, -5.72802734375, -5.12109375, -4.51416015625, -3.9072265625, -3.30029296875, -2.693359375, -2.08642578125, -1.4794921875, -0.87255859375, -0.265625, 0.34130859375, 0.9482421875, 1.55517578125, 2.162109375, 2.76904296875, 3.3759765625, 3.98291015625, 4.58984375, 5.19677734375, 5.8037109375, 6.41064453125, 7.017578125, 7.62451171875, 8.2314453125, 8.83837890625, 9.4453125, 10.05224609375, 10.6591796875, 11.26611328125, 11.873046875, 12.47998046875, 13.0869140625, 13.69384765625, 14.30078125, 14.90771484375, 15.5146484375, 16.12158203125, 16.728515625, 17.33544921875, 17.9423828125, 18.54931640625, 19.15625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 7.0, 7.0, 12.0, 11.0, 14.0, 15.0, 7.0, 28.0, 15.0, 26.0, 31.0, 29.0, 42.0, 36.0, 36.0, 51.0, 42.0, 37.0, 40.0, 55.0, 51.0, 54.0, 37.0, 27.0, 39.0, 33.0, 28.0, 33.0, 24.0, 24.0, 19.0, 15.0, 11.0, 16.0, 8.0, 11.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8515625, -10.503662109375, -10.15576171875, -9.807861328125, -9.4599609375, -9.112060546875, -8.76416015625, -8.416259765625, -8.068359375, -7.720458984375, -7.37255859375, -7.024658203125, -6.6767578125, -6.328857421875, -5.98095703125, -5.633056640625, -5.28515625, -4.937255859375, -4.58935546875, -4.241455078125, -3.8935546875, -3.545654296875, -3.19775390625, -2.849853515625, -2.501953125, -2.154052734375, -1.80615234375, -1.458251953125, -1.1103515625, -0.762451171875, -0.41455078125, -0.066650390625, 0.28125, 0.629150390625, 0.97705078125, 1.324951171875, 1.6728515625, 2.020751953125, 2.36865234375, 2.716552734375, 3.064453125, 3.412353515625, 3.76025390625, 4.108154296875, 4.4560546875, 4.803955078125, 5.15185546875, 5.499755859375, 5.84765625, 6.195556640625, 6.54345703125, 6.891357421875, 7.2392578125, 7.587158203125, 7.93505859375, 8.282958984375, 8.630859375, 8.978759765625, 9.32666015625, 9.674560546875, 10.0224609375, 10.370361328125, 10.71826171875, 11.066162109375, 11.4140625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 4.0, 6.0, 7.0, 10.0, 8.0, 5.0, 9.0, 12.0, 13.0, 21.0, 18.0, 26.0, 26.0, 33.0, 37.0, 31.0, 28.0, 47.0, 35.0, 36.0, 41.0, 45.0, 51.0, 49.0, 33.0, 38.0, 41.0, 38.0, 29.0, 27.0, 32.0, 19.0, 19.0, 27.0, 14.0, 17.0, 16.0, 12.0, 12.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-68.19844055175781, -66.23094940185547, -64.26345825195312, -62.295963287353516, -60.32847213745117, -58.36098098754883, -56.39348602294922, -54.425994873046875, -52.45850372314453, -50.49101257324219, -48.523521423339844, -46.556026458740234, -44.58853530883789, -42.62104415893555, -40.65354919433594, -38.686058044433594, -36.71856689453125, -34.751075744628906, -32.78358459472656, -30.816089630126953, -28.84859848022461, -26.881107330322266, -24.91361427307129, -22.946121215820312, -20.97863006591797, -19.011138916015625, -17.04364585876465, -15.076153755187988, -13.108661651611328, -11.141169548034668, -9.173677444458008, -7.206185340881348, -5.238697052001953, -3.271204948425293, -1.3037128448486328, 0.6637792587280273, 2.6312713623046875, 4.598763465881348, 6.566255569458008, 8.533747673034668, 10.501239776611328, 12.468731880187988, 14.436223983764648, 16.403717041015625, 18.37120819091797, 20.338699340820312, 22.30619239807129, 24.273685455322266, 26.24117660522461, 28.208667755126953, 30.17616081237793, 32.143653869628906, 34.11114501953125, 36.078636169433594, 38.04612731933594, 40.01362228393555, 41.98111343383789, 43.948604583740234, 45.916099548339844, 47.88359069824219, 49.85108184814453, 51.818572998046875, 53.78606414794922, 55.75355911254883, 57.72105026245117]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 6.0, 10.0, 7.0, 5.0, 15.0, 13.0, 13.0, 10.0, 20.0, 23.0, 24.0, 26.0, 30.0, 26.0, 34.0, 27.0, 27.0, 40.0, 31.0, 37.0, 42.0, 42.0, 35.0, 39.0, 44.0, 36.0, 39.0, 35.0, 36.0, 28.0, 27.0, 32.0, 25.0, 16.0, 13.0, 13.0, 13.0, 9.0, 12.0, 7.0, 8.0, 3.0, 1.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.96417236328125, -69.64633178710938, -67.32849884033203, -65.01065826416016, -62.69282150268555, -60.37498474121094, -58.05714416503906, -55.73930740356445, -53.421470642089844, -51.103633880615234, -48.785797119140625, -46.46795654296875, -44.15011978149414, -41.83228302001953, -39.514442443847656, -37.19660568237305, -34.87876892089844, -32.56093215942383, -30.243093490600586, -27.925254821777344, -25.607418060302734, -23.289581298828125, -20.971742630004883, -18.65390396118164, -16.33606719970703, -14.018229484558105, -11.70039176940918, -9.382554054260254, -7.064716339111328, -4.746878623962402, -2.4290409088134766, -0.11120223999023438, 2.2066421508789062, 4.524479866027832, 6.842317581176758, 9.160155296325684, 11.47799301147461, 13.795830726623535, 16.11366844177246, 18.431507110595703, 20.749343872070312, 23.067180633544922, 25.385019302368164, 27.702857971191406, 30.020694732666016, 32.338531494140625, 34.6563720703125, 36.97420883178711, 39.29204559326172, 41.60988235473633, 43.92771911621094, 46.24555969238281, 48.56339645385742, 50.88123321533203, 53.199073791503906, 55.516910552978516, 57.834747314453125, 60.152584075927734, 62.470420837402344, 64.78826141357422, 67.10609436035156, 69.42393493652344, 71.74177551269531, 74.05961608886719, 76.37744903564453]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 8.0, 9.0, 14.0, 38.0, 37.0, 83.0, 126.0, 216.0, 372.0, 662.0, 1084.0, 1871.0, 2974.0, 5202.0, 8791.0, 14234.0, 23117.0, 37060.0, 57523.0, 87068.0, 128465.0, 179982.0, 243340.0, 308474.0, 367950.0, 409735.0, 424477.0, 410613.0, 369544.0, 309948.0, 245298.0, 182600.0, 129856.0, 88556.0, 58590.0, 37618.0, 23447.0, 14285.0, 8713.0, 5055.0, 3060.0, 1748.0, 1057.0, 586.0, 340.0, 195.0, 100.0, 62.0, 45.0, 20.0, 10.0, 16.0, 11.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.59375, -46.08349609375, -44.5732421875, -43.06298828125, -41.552734375, -40.04248046875, -38.5322265625, -37.02197265625, -35.51171875, -34.00146484375, -32.4912109375, -30.98095703125, -29.470703125, -27.96044921875, -26.4501953125, -24.93994140625, -23.4296875, -21.91943359375, -20.4091796875, -18.89892578125, -17.388671875, -15.87841796875, -14.3681640625, -12.85791015625, -11.34765625, -9.83740234375, -8.3271484375, -6.81689453125, -5.306640625, -3.79638671875, -2.2861328125, -0.77587890625, 0.734375, 2.24462890625, 3.7548828125, 5.26513671875, 6.775390625, 8.28564453125, 9.7958984375, 11.30615234375, 12.81640625, 14.32666015625, 15.8369140625, 17.34716796875, 18.857421875, 20.36767578125, 21.8779296875, 23.38818359375, 24.8984375, 26.40869140625, 27.9189453125, 29.42919921875, 30.939453125, 32.44970703125, 33.9599609375, 35.47021484375, 36.98046875, 38.49072265625, 40.0009765625, 41.51123046875, 43.021484375, 44.53173828125, 46.0419921875, 47.55224609375, 49.0625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 10.0, 7.0, 6.0, 10.0, 15.0, 16.0, 12.0, 15.0, 20.0, 23.0, 27.0, 31.0, 26.0, 33.0, 27.0, 26.0, 31.0, 47.0, 26.0, 40.0, 49.0, 33.0, 39.0, 46.0, 34.0, 36.0, 39.0, 33.0, 33.0, 28.0, 33.0, 24.0, 19.0, 11.0, 15.0, 13.0, 13.0, 8.0, 9.0, 6.0, 5.0, 1.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.8310546875, -65.599609375, -63.3681640625, -61.13671875, -58.9052734375, -56.673828125, -54.4423828125, -52.2109375, -49.9794921875, -47.748046875, -45.5166015625, -43.28515625, -41.0537109375, -38.822265625, -36.5908203125, -34.359375, -32.1279296875, -29.896484375, -27.6650390625, -25.43359375, -23.2021484375, -20.970703125, -18.7392578125, -16.5078125, -14.2763671875, -12.044921875, -9.8134765625, -7.58203125, -5.3505859375, -3.119140625, -0.8876953125, 1.34375, 3.5751953125, 5.806640625, 8.0380859375, 10.26953125, 12.5009765625, 14.732421875, 16.9638671875, 19.1953125, 21.4267578125, 23.658203125, 25.8896484375, 28.12109375, 30.3525390625, 32.583984375, 34.8154296875, 37.046875, 39.2783203125, 41.509765625, 43.7412109375, 45.97265625, 48.2041015625, 50.435546875, 52.6669921875, 54.8984375, 57.1298828125, 59.361328125, 61.5927734375, 63.82421875, 66.0556640625, 68.287109375, 70.5185546875, 72.75]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 14.0, 23.0, 35.0, 55.0, 114.0, 186.0, 368.0, 542.0, 935.0, 1610.0, 2601.0, 4214.0, 6900.0, 10964.0, 16819.0, 26021.0, 38856.0, 57466.0, 82106.0, 114107.0, 152272.0, 196654.0, 243851.0, 288975.0, 327980.0, 353175.0, 361629.0, 352701.0, 326822.0, 286397.0, 241742.0, 192602.0, 150385.0, 111531.0, 80422.0, 55833.0, 38263.0, 25322.0, 16439.0, 10412.0, 6562.0, 4106.0, 2498.0, 1541.0, 907.0, 565.0, 321.0, 208.0, 108.0, 47.0, 50.0, 19.0, 6.0, 4.0, 4.0, 2.0], "bins": [-49.53125, -48.09423828125, -46.6572265625, -45.22021484375, -43.783203125, -42.34619140625, -40.9091796875, -39.47216796875, -38.03515625, -36.59814453125, -35.1611328125, -33.72412109375, -32.287109375, -30.85009765625, -29.4130859375, -27.97607421875, -26.5390625, -25.10205078125, -23.6650390625, -22.22802734375, -20.791015625, -19.35400390625, -17.9169921875, -16.47998046875, -15.04296875, -13.60595703125, -12.1689453125, -10.73193359375, -9.294921875, -7.85791015625, -6.4208984375, -4.98388671875, -3.546875, -2.10986328125, -0.6728515625, 0.76416015625, 2.201171875, 3.63818359375, 5.0751953125, 6.51220703125, 7.94921875, 9.38623046875, 10.8232421875, 12.26025390625, 13.697265625, 15.13427734375, 16.5712890625, 18.00830078125, 19.4453125, 20.88232421875, 22.3193359375, 23.75634765625, 25.193359375, 26.63037109375, 28.0673828125, 29.50439453125, 30.94140625, 32.37841796875, 33.8154296875, 35.25244140625, 36.689453125, 38.12646484375, 39.5634765625, 41.00048828125, 42.4375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 12.0, 10.0, 21.0, 21.0, 23.0, 28.0, 33.0, 55.0, 68.0, 63.0, 91.0, 92.0, 102.0, 132.0, 141.0, 150.0, 160.0, 155.0, 186.0, 188.0, 190.0, 161.0, 179.0, 185.0, 189.0, 175.0, 189.0, 141.0, 110.0, 136.0, 107.0, 82.0, 91.0, 71.0, 67.0, 55.0, 51.0, 37.0, 28.0, 23.0, 18.0, 8.0, 12.0, 10.0, 1.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-29.796875, -28.88916015625, -27.9814453125, -27.07373046875, -26.166015625, -25.25830078125, -24.3505859375, -23.44287109375, -22.53515625, -21.62744140625, -20.7197265625, -19.81201171875, -18.904296875, -17.99658203125, -17.0888671875, -16.18115234375, -15.2734375, -14.36572265625, -13.4580078125, -12.55029296875, -11.642578125, -10.73486328125, -9.8271484375, -8.91943359375, -8.01171875, -7.10400390625, -6.1962890625, -5.28857421875, -4.380859375, -3.47314453125, -2.5654296875, -1.65771484375, -0.75, 0.15771484375, 1.0654296875, 1.97314453125, 2.880859375, 3.78857421875, 4.6962890625, 5.60400390625, 6.51171875, 7.41943359375, 8.3271484375, 9.23486328125, 10.142578125, 11.05029296875, 11.9580078125, 12.86572265625, 13.7734375, 14.68115234375, 15.5888671875, 16.49658203125, 17.404296875, 18.31201171875, 19.2197265625, 20.12744140625, 21.03515625, 21.94287109375, 22.8505859375, 23.75830078125, 24.666015625, 25.57373046875, 26.4814453125, 27.38916015625, 28.296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 6.0, 4.0, 12.0, 14.0, 12.0, 12.0, 33.0, 16.0, 26.0, 11.0, 27.0, 27.0, 35.0, 30.0, 38.0, 48.0, 40.0, 46.0, 42.0, 41.0, 53.0, 39.0, 29.0, 45.0, 38.0, 40.0, 36.0, 28.0, 23.0, 16.0, 20.0, 20.0, 10.0, 15.0, 11.0, 9.0, 10.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.62174987792969, -69.43634796142578, -67.25094604492188, -65.06553649902344, -62.88013458251953, -60.694732666015625, -58.50933074951172, -56.32392883300781, -54.13852310180664, -51.953121185302734, -49.76771545410156, -47.582313537597656, -45.39691162109375, -43.21150588989258, -41.02610397338867, -38.8406982421875, -36.655296325683594, -34.46989440917969, -32.284488677978516, -30.09908676147461, -27.91368293762207, -25.72827911376953, -23.542877197265625, -21.357473373413086, -19.172069549560547, -16.986665725708008, -14.801262855529785, -12.615859985351562, -10.430456161499023, -8.245052337646484, -6.059649467468262, -3.874246597290039, -1.6888351440429688, 0.4965682029724121, 2.681971549987793, 4.867374897003174, 7.052778244018555, 9.238182067871094, 11.423584938049316, 13.608987808227539, 15.794391632080078, 17.979795455932617, 20.165199279785156, 22.350601196289062, 24.5360050201416, 26.72140884399414, 28.906810760498047, 31.092214584350586, 33.277618408203125, 35.46302032470703, 37.6484260559082, 39.83382797241211, 42.01923370361328, 44.20463562011719, 46.390037536621094, 48.575439453125, 50.76084518432617, 52.94624710083008, 55.13165283203125, 57.317054748535156, 59.50245666503906, 61.687862396240234, 63.87326431274414, 66.05867004394531, 68.24407196044922]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 7.0, 15.0, 17.0, 10.0, 14.0, 26.0, 21.0, 15.0, 32.0, 31.0, 30.0, 33.0, 39.0, 23.0, 43.0, 37.0, 40.0, 49.0, 42.0, 41.0, 54.0, 34.0, 42.0, 37.0, 28.0, 38.0, 29.0, 20.0, 24.0, 21.0, 13.0, 11.0, 13.0, 13.0, 8.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-92.8331527709961, -90.14823150634766, -87.46330261230469, -84.77838134765625, -82.09346008300781, -79.40853118896484, -76.7236099243164, -74.03868103027344, -71.353759765625, -68.66883850097656, -65.9839096069336, -63.298988342285156, -60.61406326293945, -57.92913818359375, -55.24421691894531, -52.55929183959961, -49.874366760253906, -47.1894416809082, -44.5045166015625, -41.81959533691406, -39.13467025756836, -36.449745178222656, -33.76482391357422, -31.079898834228516, -28.394973754882812, -25.71004867553711, -23.02512550354004, -20.34020233154297, -17.655277252197266, -14.970353126525879, -12.285429000854492, -9.600505828857422, -6.9155731201171875, -4.230648994445801, -1.545724868774414, 1.1391992568969727, 3.8241233825683594, 6.509047508239746, 9.193971633911133, 11.878894805908203, 14.563819885253906, 17.24874496459961, 19.93366813659668, 22.61859130859375, 25.303516387939453, 27.988441467285156, 30.673364639282227, 33.3582878112793, 36.043212890625, 38.7281379699707, 41.413063049316406, 44.097984313964844, 46.78290939331055, 49.46783447265625, 52.15275573730469, 54.83768081665039, 57.522605895996094, 60.2075309753418, 62.8924560546875, 65.57737731933594, 68.26229858398438, 70.94722747802734, 73.63214874267578, 76.31707763671875, 79.00199890136719]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 2.0, 16.0, 13.0, 21.0, 28.0, 28.0, 64.0, 102.0, 155.0, 258.0, 374.0, 557.0, 847.0, 1395.0, 2158.0, 3431.0, 5278.0, 8209.0, 12581.0, 19029.0, 28774.0, 42122.0, 59198.0, 80196.0, 101198.0, 117153.0, 121476.0, 112464.0, 94320.0, 73283.0, 53352.0, 37194.0, 25552.0, 16873.0, 10972.0, 7217.0, 4376.0, 2974.0, 1915.0, 1230.0, 748.0, 523.0, 310.0, 191.0, 143.0, 85.0, 60.0, 29.0, 36.0, 13.0, 8.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0], "bins": [-11.46875, -11.124755859375, -10.78076171875, -10.436767578125, -10.0927734375, -9.748779296875, -9.40478515625, -9.060791015625, -8.716796875, -8.372802734375, -8.02880859375, -7.684814453125, -7.3408203125, -6.996826171875, -6.65283203125, -6.308837890625, -5.96484375, -5.620849609375, -5.27685546875, -4.932861328125, -4.5888671875, -4.244873046875, -3.90087890625, -3.556884765625, -3.212890625, -2.868896484375, -2.52490234375, -2.180908203125, -1.8369140625, -1.492919921875, -1.14892578125, -0.804931640625, -0.4609375, -0.116943359375, 0.22705078125, 0.571044921875, 0.9150390625, 1.259033203125, 1.60302734375, 1.947021484375, 2.291015625, 2.635009765625, 2.97900390625, 3.322998046875, 3.6669921875, 4.010986328125, 4.35498046875, 4.698974609375, 5.04296875, 5.386962890625, 5.73095703125, 6.074951171875, 6.4189453125, 6.762939453125, 7.10693359375, 7.450927734375, 7.794921875, 8.138916015625, 8.48291015625, 8.826904296875, 9.1708984375, 9.514892578125, 9.85888671875, 10.202880859375, 10.546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 8.0, 14.0, 17.0, 10.0, 13.0, 24.0, 21.0, 17.0, 32.0, 31.0, 30.0, 32.0, 39.0, 26.0, 41.0, 36.0, 43.0, 43.0, 44.0, 45.0, 53.0, 33.0, 42.0, 37.0, 27.0, 39.0, 29.0, 21.0, 24.0, 22.0, 12.0, 11.0, 13.0, 13.0, 8.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-93.125, -90.431640625, -87.73828125, -85.044921875, -82.3515625, -79.658203125, -76.96484375, -74.271484375, -71.578125, -68.884765625, -66.19140625, -63.498046875, -60.8046875, -58.111328125, -55.41796875, -52.724609375, -50.03125, -47.337890625, -44.64453125, -41.951171875, -39.2578125, -36.564453125, -33.87109375, -31.177734375, -28.484375, -25.791015625, -23.09765625, -20.404296875, -17.7109375, -15.017578125, -12.32421875, -9.630859375, -6.9375, -4.244140625, -1.55078125, 1.142578125, 3.8359375, 6.529296875, 9.22265625, 11.916015625, 14.609375, 17.302734375, 19.99609375, 22.689453125, 25.3828125, 28.076171875, 30.76953125, 33.462890625, 36.15625, 38.849609375, 41.54296875, 44.236328125, 46.9296875, 49.623046875, 52.31640625, 55.009765625, 57.703125, 60.396484375, 63.08984375, 65.783203125, 68.4765625, 71.169921875, 73.86328125, 76.556640625, 79.25]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 9.0, 7.0, 15.0, 27.0, 25.0, 50.0, 59.0, 93.0, 145.0, 186.0, 269.0, 372.0, 547.0, 832.0, 1178.0, 1696.0, 2452.0, 3394.0, 4821.0, 7015.0, 10048.0, 14711.0, 23963.0, 74384.0, 724546.0, 101644.0, 25724.0, 15959.0, 10446.0, 7107.0, 4992.0, 3537.0, 2467.0, 1698.0, 1259.0, 911.0, 585.0, 400.0, 283.0, 209.0, 138.0, 99.0, 78.0, 59.0, 49.0, 19.0, 18.0, 5.0, 11.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0], "bins": [-21.828125, -21.15771484375, -20.4873046875, -19.81689453125, -19.146484375, -18.47607421875, -17.8056640625, -17.13525390625, -16.46484375, -15.79443359375, -15.1240234375, -14.45361328125, -13.783203125, -13.11279296875, -12.4423828125, -11.77197265625, -11.1015625, -10.43115234375, -9.7607421875, -9.09033203125, -8.419921875, -7.74951171875, -7.0791015625, -6.40869140625, -5.73828125, -5.06787109375, -4.3974609375, -3.72705078125, -3.056640625, -2.38623046875, -1.7158203125, -1.04541015625, -0.375, 0.29541015625, 0.9658203125, 1.63623046875, 2.306640625, 2.97705078125, 3.6474609375, 4.31787109375, 4.98828125, 5.65869140625, 6.3291015625, 6.99951171875, 7.669921875, 8.34033203125, 9.0107421875, 9.68115234375, 10.3515625, 11.02197265625, 11.6923828125, 12.36279296875, 13.033203125, 13.70361328125, 14.3740234375, 15.04443359375, 15.71484375, 16.38525390625, 17.0556640625, 17.72607421875, 18.396484375, 19.06689453125, 19.7373046875, 20.40771484375, 21.078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 8.0, 18.0, 14.0, 17.0, 20.0, 8.0, 17.0, 25.0, 12.0, 21.0, 29.0, 31.0, 36.0, 27.0, 39.0, 37.0, 37.0, 42.0, 36.0, 35.0, 40.0, 40.0, 36.0, 32.0, 31.0, 33.0, 30.0, 14.0, 30.0, 22.0, 21.0, 16.0, 26.0, 17.0, 18.0, 14.0, 16.0, 8.0, 5.0, 7.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.71875, -47.09619140625, -45.4736328125, -43.85107421875, -42.228515625, -40.60595703125, -38.9833984375, -37.36083984375, -35.73828125, -34.11572265625, -32.4931640625, -30.87060546875, -29.248046875, -27.62548828125, -26.0029296875, -24.38037109375, -22.7578125, -21.13525390625, -19.5126953125, -17.89013671875, -16.267578125, -14.64501953125, -13.0224609375, -11.39990234375, -9.77734375, -8.15478515625, -6.5322265625, -4.90966796875, -3.287109375, -1.66455078125, -0.0419921875, 1.58056640625, 3.203125, 4.82568359375, 6.4482421875, 8.07080078125, 9.693359375, 11.31591796875, 12.9384765625, 14.56103515625, 16.18359375, 17.80615234375, 19.4287109375, 21.05126953125, 22.673828125, 24.29638671875, 25.9189453125, 27.54150390625, 29.1640625, 30.78662109375, 32.4091796875, 34.03173828125, 35.654296875, 37.27685546875, 38.8994140625, 40.52197265625, 42.14453125, 43.76708984375, 45.3896484375, 47.01220703125, 48.634765625, 50.25732421875, 51.8798828125, 53.50244140625, 55.125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 10.0, 4.0, 11.0, 14.0, 30.0, 40.0, 58.0, 80.0, 144.0, 211.0, 331.0, 531.0, 927.0, 1444.0, 2398.0, 4215.0, 6922.0, 11918.0, 20799.0, 40820.0, 817038.0, 79921.0, 25590.0, 14505.0, 8258.0, 4765.0, 2925.0, 1761.0, 1099.0, 625.0, 435.0, 255.0, 166.0, 100.0, 59.0, 42.0, 24.0, 19.0, 21.0, 9.0, 6.0, 2.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.640625, -2.5416259765625, -2.442626953125, -2.3436279296875, -2.24462890625, -2.1456298828125, -2.046630859375, -1.9476318359375, -1.8486328125, -1.7496337890625, -1.650634765625, -1.5516357421875, -1.45263671875, -1.3536376953125, -1.254638671875, -1.1556396484375, -1.056640625, -0.9576416015625, -0.858642578125, -0.7596435546875, -0.66064453125, -0.5616455078125, -0.462646484375, -0.3636474609375, -0.2646484375, -0.1656494140625, -0.066650390625, 0.0323486328125, 0.13134765625, 0.2303466796875, 0.329345703125, 0.4283447265625, 0.52734375, 0.6263427734375, 0.725341796875, 0.8243408203125, 0.92333984375, 1.0223388671875, 1.121337890625, 1.2203369140625, 1.3193359375, 1.4183349609375, 1.517333984375, 1.6163330078125, 1.71533203125, 1.8143310546875, 1.913330078125, 2.0123291015625, 2.111328125, 2.2103271484375, 2.309326171875, 2.4083251953125, 2.50732421875, 2.6063232421875, 2.705322265625, 2.8043212890625, 2.9033203125, 3.0023193359375, 3.101318359375, 3.2003173828125, 3.29931640625, 3.3983154296875, 3.497314453125, 3.5963134765625, 3.6953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 6.0, 13.0, 17.0, 13.0, 22.0, 20.0, 21.0, 21.0, 40.0, 37.0, 42.0, 48.0, 44.0, 46.0, 52.0, 53.0, 42.0, 54.0, 45.0, 50.0, 40.0, 41.0, 22.0, 30.0, 30.0, 13.0, 26.0, 22.0, 14.0, 19.0, 10.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.185075759887695e-05, -8.923280984163284e-05, -8.661486208438873e-05, -8.399691432714462e-05, -8.137896656990051e-05, -7.87610188126564e-05, -7.614307105541229e-05, -7.352512329816818e-05, -7.090717554092407e-05, -6.828922778367996e-05, -6.567128002643585e-05, -6.305333226919174e-05, -6.043538451194763e-05, -5.781743675470352e-05, -5.519948899745941e-05, -5.25815412402153e-05, -4.996359348297119e-05, -4.734564572572708e-05, -4.472769796848297e-05, -4.210975021123886e-05, -3.949180245399475e-05, -3.687385469675064e-05, -3.425590693950653e-05, -3.163795918226242e-05, -2.902001142501831e-05, -2.64020636677742e-05, -2.378411591053009e-05, -2.116616815328598e-05, -1.854822039604187e-05, -1.593027263879776e-05, -1.331232488155365e-05, -1.069437712430954e-05, -8.07642936706543e-06, -5.45848160982132e-06, -2.8405338525772095e-06, -2.2258609533309937e-07, 2.3953616619110107e-06, 5.013309419155121e-06, 7.631257176399231e-06, 1.0249204933643341e-05, 1.2867152690887451e-05, 1.548510044813156e-05, 1.810304820537567e-05, 2.072099596261978e-05, 2.333894371986389e-05, 2.5956891477108002e-05, 2.8574839234352112e-05, 3.119278699159622e-05, 3.381073474884033e-05, 3.642868250608444e-05, 3.904663026332855e-05, 4.166457802057266e-05, 4.428252577781677e-05, 4.690047353506088e-05, 4.951842129230499e-05, 5.21363690495491e-05, 5.475431680679321e-05, 5.737226456403732e-05, 5.999021232128143e-05, 6.260816007852554e-05, 6.522610783576965e-05, 6.784405559301376e-05, 7.046200335025787e-05, 7.307995110750198e-05, 7.56978988647461e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 14.0, 12.0, 18.0, 38.0, 64.0, 119.0, 200.0, 303.0, 476.0, 866.0, 1548.0, 2549.0, 4217.0, 7221.0, 12463.0, 21180.0, 34973.0, 57077.0, 91183.0, 134474.0, 171199.0, 166988.0, 125995.0, 83971.0, 52424.0, 32261.0, 19117.0, 11356.0, 6721.0, 3987.0, 2289.0, 1353.0, 751.0, 462.0, 273.0, 144.0, 101.0, 59.0, 44.0, 23.0, 12.0, 11.0, 11.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.78515625, -2.6978759765625, -2.610595703125, -2.5233154296875, -2.43603515625, -2.3487548828125, -2.261474609375, -2.1741943359375, -2.0869140625, -1.9996337890625, -1.912353515625, -1.8250732421875, -1.73779296875, -1.6505126953125, -1.563232421875, -1.4759521484375, -1.388671875, -1.3013916015625, -1.214111328125, -1.1268310546875, -1.03955078125, -0.9522705078125, -0.864990234375, -0.7777099609375, -0.6904296875, -0.6031494140625, -0.515869140625, -0.4285888671875, -0.34130859375, -0.2540283203125, -0.166748046875, -0.0794677734375, 0.0078125, 0.0950927734375, 0.182373046875, 0.2696533203125, 0.35693359375, 0.4442138671875, 0.531494140625, 0.6187744140625, 0.7060546875, 0.7933349609375, 0.880615234375, 0.9678955078125, 1.05517578125, 1.1424560546875, 1.229736328125, 1.3170166015625, 1.404296875, 1.4915771484375, 1.578857421875, 1.6661376953125, 1.75341796875, 1.8406982421875, 1.927978515625, 2.0152587890625, 2.1025390625, 2.1898193359375, 2.277099609375, 2.3643798828125, 2.45166015625, 2.5389404296875, 2.626220703125, 2.7135009765625, 2.80078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 14.0, 10.0, 15.0, 15.0, 14.0, 16.0, 18.0, 25.0, 33.0, 30.0, 36.0, 41.0, 40.0, 57.0, 42.0, 39.0, 47.0, 56.0, 54.0, 53.0, 53.0, 34.0, 34.0, 36.0, 22.0, 25.0, 22.0, 26.0, 15.0, 14.0, 7.0, 7.0, 6.0, 3.0, 12.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3271484375, -1.2866668701171875, -1.246185302734375, -1.2057037353515625, -1.16522216796875, -1.1247406005859375, -1.084259033203125, -1.0437774658203125, -1.0032958984375, -0.9628143310546875, -0.922332763671875, -0.8818511962890625, -0.84136962890625, -0.8008880615234375, -0.760406494140625, -0.7199249267578125, -0.679443359375, -0.6389617919921875, -0.598480224609375, -0.5579986572265625, -0.51751708984375, -0.4770355224609375, -0.436553955078125, -0.3960723876953125, -0.3555908203125, -0.3151092529296875, -0.274627685546875, -0.2341461181640625, -0.19366455078125, -0.1531829833984375, -0.112701416015625, -0.0722198486328125, -0.03173828125, 0.0087432861328125, 0.049224853515625, 0.0897064208984375, 0.13018798828125, 0.1706695556640625, 0.211151123046875, 0.2516326904296875, 0.2921142578125, 0.3325958251953125, 0.373077392578125, 0.4135589599609375, 0.45404052734375, 0.4945220947265625, 0.535003662109375, 0.5754852294921875, 0.615966796875, 0.6564483642578125, 0.696929931640625, 0.7374114990234375, 0.77789306640625, 0.8183746337890625, 0.858856201171875, 0.8993377685546875, 0.9398193359375, 0.9803009033203125, 1.020782470703125, 1.0612640380859375, 1.10174560546875, 1.1422271728515625, 1.182708740234375, 1.2231903076171875, 1.263671875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 11.0, 5.0, 9.0, 5.0, 5.0, 13.0, 9.0, 17.0, 16.0, 27.0, 21.0, 21.0, 18.0, 32.0, 24.0, 35.0, 30.0, 37.0, 53.0, 46.0, 36.0, 43.0, 54.0, 34.0, 47.0, 35.0, 41.0, 38.0, 35.0, 29.0, 34.0, 22.0, 23.0, 16.0, 13.0, 13.0, 11.0, 8.0, 12.0, 9.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.83599090576172, -68.6427001953125, -66.44940948486328, -64.25611114501953, -62.06282043457031, -59.869529724121094, -57.676239013671875, -55.482948303222656, -53.28965377807617, -51.09636306762695, -48.90306854248047, -46.70977783203125, -44.51648712158203, -42.32319259643555, -40.12990188598633, -37.936607360839844, -35.743316650390625, -33.550025939941406, -31.356731414794922, -29.163440704345703, -26.97014808654785, -24.77685546875, -22.58356475830078, -20.39027214050293, -18.196979522705078, -16.003686904907227, -13.810395240783691, -11.617103576660156, -9.423810958862305, -7.230518341064453, -5.037226676940918, -2.843935012817383, -0.6506423950195312, 1.542649745941162, 3.7359418869018555, 5.929234027862549, 8.122526168823242, 10.315818786621094, 12.509110450744629, 14.702402114868164, 16.895694732666016, 19.088987350463867, 21.28227996826172, 23.475570678710938, 25.66886329650879, 27.86215591430664, 30.05544662475586, 32.248741149902344, 34.44203186035156, 36.63532257080078, 38.828617095947266, 41.021907806396484, 43.21520233154297, 45.40849304199219, 47.601783752441406, 49.795074462890625, 51.98836898803711, 54.18165969848633, 56.37495422363281, 58.56824493408203, 60.76153564453125, 62.954830169677734, 65.14812469482422, 67.34141540527344, 69.53470611572266]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 10.0, 11.0, 18.0, 12.0, 11.0, 25.0, 21.0, 17.0, 29.0, 29.0, 29.0, 32.0, 45.0, 24.0, 38.0, 37.0, 41.0, 44.0, 41.0, 43.0, 60.0, 34.0, 40.0, 33.0, 32.0, 38.0, 31.0, 21.0, 26.0, 17.0, 18.0, 12.0, 10.0, 12.0, 9.0, 10.0, 7.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-93.45228576660156, -90.76252746582031, -88.07276916503906, -85.38300323486328, -82.69324493408203, -80.00348663330078, -77.313720703125, -74.62396240234375, -71.9342041015625, -69.24444580078125, -66.5546875, -63.86492156982422, -61.17516326904297, -58.48540496826172, -55.7956428527832, -53.10588073730469, -50.41612243652344, -47.72636413574219, -45.03660202026367, -42.346839904785156, -39.657081604003906, -36.967323303222656, -34.27756118774414, -31.587800979614258, -28.898040771484375, -26.208280563354492, -23.51852035522461, -20.828760147094727, -18.138999938964844, -15.449239730834961, -12.759479522705078, -10.069719314575195, -7.3799591064453125, -4.69019889831543, -2.000438690185547, 0.6893215179443359, 3.3790817260742188, 6.068841934204102, 8.758602142333984, 11.448362350463867, 14.13812255859375, 16.827882766723633, 19.517642974853516, 22.2074031829834, 24.89716339111328, 27.586923599243164, 30.276683807373047, 32.96644592285156, 35.65620422363281, 38.34596252441406, 41.03572463989258, 43.725486755371094, 46.415245056152344, 49.105003356933594, 51.79476547241211, 54.484527587890625, 57.174285888671875, 59.864044189453125, 62.55380630493164, 65.24356842041016, 67.9333267211914, 70.62308502197266, 73.31285095214844, 76.00260925292969, 78.69236755371094]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 12.0, 20.0, 34.0, 47.0, 111.0, 140.0, 215.0, 443.0, 662.0, 1145.0, 1737.0, 2901.0, 4831.0, 7677.0, 11948.0, 18496.0, 27974.0, 39692.0, 54878.0, 70863.0, 86648.0, 99660.0, 106413.0, 105433.0, 97258.0, 83167.0, 67487.0, 50953.0, 36527.0, 25468.0, 16766.0, 11006.0, 6938.0, 4235.0, 2617.0, 1585.0, 1020.0, 631.0, 376.0, 207.0, 148.0, 87.0, 39.0, 31.0, 13.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.625, -42.11474609375, -40.6044921875, -39.09423828125, -37.583984375, -36.07373046875, -34.5634765625, -33.05322265625, -31.54296875, -30.03271484375, -28.5224609375, -27.01220703125, -25.501953125, -23.99169921875, -22.4814453125, -20.97119140625, -19.4609375, -17.95068359375, -16.4404296875, -14.93017578125, -13.419921875, -11.90966796875, -10.3994140625, -8.88916015625, -7.37890625, -5.86865234375, -4.3583984375, -2.84814453125, -1.337890625, 0.17236328125, 1.6826171875, 3.19287109375, 4.703125, 6.21337890625, 7.7236328125, 9.23388671875, 10.744140625, 12.25439453125, 13.7646484375, 15.27490234375, 16.78515625, 18.29541015625, 19.8056640625, 21.31591796875, 22.826171875, 24.33642578125, 25.8466796875, 27.35693359375, 28.8671875, 30.37744140625, 31.8876953125, 33.39794921875, 34.908203125, 36.41845703125, 37.9287109375, 39.43896484375, 40.94921875, 42.45947265625, 43.9697265625, 45.47998046875, 46.990234375, 48.50048828125, 50.0107421875, 51.52099609375, 53.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 9.0, 13.0, 16.0, 13.0, 10.0, 25.0, 20.0, 20.0, 28.0, 25.0, 31.0, 32.0, 47.0, 23.0, 38.0, 38.0, 40.0, 43.0, 46.0, 43.0, 57.0, 36.0, 37.0, 34.0, 31.0, 43.0, 27.0, 23.0, 24.0, 19.0, 15.0, 15.0, 7.0, 13.0, 9.0, 11.0, 8.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-92.6875, -90.01953125, -87.3515625, -84.68359375, -82.015625, -79.34765625, -76.6796875, -74.01171875, -71.34375, -68.67578125, -66.0078125, -63.33984375, -60.671875, -58.00390625, -55.3359375, -52.66796875, -50.0, -47.33203125, -44.6640625, -41.99609375, -39.328125, -36.66015625, -33.9921875, -31.32421875, -28.65625, -25.98828125, -23.3203125, -20.65234375, -17.984375, -15.31640625, -12.6484375, -9.98046875, -7.3125, -4.64453125, -1.9765625, 0.69140625, 3.359375, 6.02734375, 8.6953125, 11.36328125, 14.03125, 16.69921875, 19.3671875, 22.03515625, 24.703125, 27.37109375, 30.0390625, 32.70703125, 35.375, 38.04296875, 40.7109375, 43.37890625, 46.046875, 48.71484375, 51.3828125, 54.05078125, 56.71875, 59.38671875, 62.0546875, 64.72265625, 67.390625, 70.05859375, 72.7265625, 75.39453125, 78.0625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 6.0, 3.0, 9.0, 9.0, 22.0, 32.0, 68.0, 71.0, 103.0, 153.0, 271.0, 414.0, 631.0, 995.0, 1500.0, 2304.0, 3505.0, 5185.0, 7791.0, 11432.0, 16503.0, 23059.0, 31627.0, 42442.0, 54730.0, 66771.0, 78688.0, 88135.0, 91781.0, 91967.0, 86992.0, 77478.0, 66007.0, 53362.0, 41624.0, 31005.0, 22592.0, 15928.0, 11040.0, 7514.0, 5101.0, 3404.0, 2209.0, 1364.0, 961.0, 616.0, 423.0, 274.0, 183.0, 111.0, 58.0, 43.0, 35.0, 15.0, 11.0, 6.0, 3.0, 1.0, 4.0, 2.0], "bins": [-47.28125, -45.8466796875, -44.412109375, -42.9775390625, -41.54296875, -40.1083984375, -38.673828125, -37.2392578125, -35.8046875, -34.3701171875, -32.935546875, -31.5009765625, -30.06640625, -28.6318359375, -27.197265625, -25.7626953125, -24.328125, -22.8935546875, -21.458984375, -20.0244140625, -18.58984375, -17.1552734375, -15.720703125, -14.2861328125, -12.8515625, -11.4169921875, -9.982421875, -8.5478515625, -7.11328125, -5.6787109375, -4.244140625, -2.8095703125, -1.375, 0.0595703125, 1.494140625, 2.9287109375, 4.36328125, 5.7978515625, 7.232421875, 8.6669921875, 10.1015625, 11.5361328125, 12.970703125, 14.4052734375, 15.83984375, 17.2744140625, 18.708984375, 20.1435546875, 21.578125, 23.0126953125, 24.447265625, 25.8818359375, 27.31640625, 28.7509765625, 30.185546875, 31.6201171875, 33.0546875, 34.4892578125, 35.923828125, 37.3583984375, 38.79296875, 40.2275390625, 41.662109375, 43.0966796875, 44.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 14.0, 12.0, 15.0, 19.0, 25.0, 20.0, 16.0, 28.0, 28.0, 36.0, 39.0, 36.0, 40.0, 42.0, 37.0, 49.0, 43.0, 38.0, 37.0, 29.0, 35.0, 49.0, 32.0, 34.0, 30.0, 23.0, 17.0, 24.0, 26.0, 16.0, 18.0, 15.0, 10.0, 8.0, 8.0, 9.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.03125, -50.24755859375, -48.4638671875, -46.68017578125, -44.896484375, -43.11279296875, -41.3291015625, -39.54541015625, -37.76171875, -35.97802734375, -34.1943359375, -32.41064453125, -30.626953125, -28.84326171875, -27.0595703125, -25.27587890625, -23.4921875, -21.70849609375, -19.9248046875, -18.14111328125, -16.357421875, -14.57373046875, -12.7900390625, -11.00634765625, -9.22265625, -7.43896484375, -5.6552734375, -3.87158203125, -2.087890625, -0.30419921875, 1.4794921875, 3.26318359375, 5.046875, 6.83056640625, 8.6142578125, 10.39794921875, 12.181640625, 13.96533203125, 15.7490234375, 17.53271484375, 19.31640625, 21.10009765625, 22.8837890625, 24.66748046875, 26.451171875, 28.23486328125, 30.0185546875, 31.80224609375, 33.5859375, 35.36962890625, 37.1533203125, 38.93701171875, 40.720703125, 42.50439453125, 44.2880859375, 46.07177734375, 47.85546875, 49.63916015625, 51.4228515625, 53.20654296875, 54.990234375, 56.77392578125, 58.5576171875, 60.34130859375, 62.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 11.0, 7.0, 18.0, 13.0, 38.0, 61.0, 100.0, 161.0, 280.0, 485.0, 790.0, 1352.0, 2301.0, 4096.0, 6875.0, 11507.0, 19034.0, 30302.0, 45594.0, 65563.0, 87105.0, 107075.0, 119980.0, 122091.0, 112278.0, 94523.0, 72608.0, 52559.0, 35335.0, 22484.0, 13991.0, 8297.0, 4948.0, 2803.0, 1631.0, 925.0, 538.0, 310.0, 186.0, 116.0, 67.0, 43.0, 31.0, 20.0, 11.0, 6.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-23.578125, -22.867431640625, -22.15673828125, -21.446044921875, -20.7353515625, -20.024658203125, -19.31396484375, -18.603271484375, -17.892578125, -17.181884765625, -16.47119140625, -15.760498046875, -15.0498046875, -14.339111328125, -13.62841796875, -12.917724609375, -12.20703125, -11.496337890625, -10.78564453125, -10.074951171875, -9.3642578125, -8.653564453125, -7.94287109375, -7.232177734375, -6.521484375, -5.810791015625, -5.10009765625, -4.389404296875, -3.6787109375, -2.968017578125, -2.25732421875, -1.546630859375, -0.8359375, -0.125244140625, 0.58544921875, 1.296142578125, 2.0068359375, 2.717529296875, 3.42822265625, 4.138916015625, 4.849609375, 5.560302734375, 6.27099609375, 6.981689453125, 7.6923828125, 8.403076171875, 9.11376953125, 9.824462890625, 10.53515625, 11.245849609375, 11.95654296875, 12.667236328125, 13.3779296875, 14.088623046875, 14.79931640625, 15.510009765625, 16.220703125, 16.931396484375, 17.64208984375, 18.352783203125, 19.0634765625, 19.774169921875, 20.48486328125, 21.195556640625, 21.90625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 8.0, 8.0, 11.0, 14.0, 25.0, 19.0, 26.0, 18.0, 38.0, 49.0, 30.0, 46.0, 49.0, 39.0, 47.0, 57.0, 49.0, 48.0, 47.0, 42.0, 45.0, 37.0, 31.0, 34.0, 32.0, 23.0, 21.0, 16.0, 14.0, 18.0, 11.0, 8.0, 8.0, 7.0, 9.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0028400421142578125, -0.0027502477169036865, -0.0026604533195495605, -0.0025706589221954346, -0.0024808645248413086, -0.0023910701274871826, -0.0023012757301330566, -0.0022114813327789307, -0.0021216869354248047, -0.0020318925380706787, -0.0019420981407165527, -0.0018523037433624268, -0.0017625093460083008, -0.0016727149486541748, -0.0015829205513000488, -0.0014931261539459229, -0.0014033317565917969, -0.001313537359237671, -0.001223742961883545, -0.001133948564529419, -0.001044154167175293, -0.000954359769821167, -0.000864565372467041, -0.000774770975112915, -0.0006849765777587891, -0.0005951821804046631, -0.0005053877830505371, -0.00041559338569641113, -0.00032579898834228516, -0.00023600459098815918, -0.0001462101936340332, -5.6415796279907227e-05, 3.337860107421875e-05, 0.00012317299842834473, 0.0002129673957824707, 0.0003027617931365967, 0.00039255619049072266, 0.00048235058784484863, 0.0005721449851989746, 0.0006619393825531006, 0.0007517337799072266, 0.0008415281772613525, 0.0009313225746154785, 0.0010211169719696045, 0.0011109113693237305, 0.0012007057666778564, 0.0012905001640319824, 0.0013802945613861084, 0.0014700889587402344, 0.0015598833560943604, 0.0016496777534484863, 0.0017394721508026123, 0.0018292665481567383, 0.0019190609455108643, 0.0020088553428649902, 0.002098649740219116, 0.002188444137573242, 0.002278238534927368, 0.002368032932281494, 0.00245782732963562, 0.002547621726989746, 0.002637416124343872, 0.002727210521697998, 0.002817004919052124, 0.00290679931640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 14.0, 18.0, 31.0, 34.0, 63.0, 101.0, 174.0, 277.0, 415.0, 652.0, 1083.0, 1661.0, 2605.0, 4134.0, 6115.0, 9402.0, 13553.0, 19606.0, 27198.0, 37052.0, 47712.0, 59921.0, 71899.0, 82279.0, 89032.0, 91428.0, 89238.0, 82608.0, 73386.0, 61071.0, 48568.0, 37712.0, 27819.0, 20028.0, 13964.0, 9401.0, 6433.0, 4274.0, 2799.0, 1804.0, 1067.0, 768.0, 412.0, 262.0, 173.0, 110.0, 82.0, 47.0, 30.0, 11.0, 10.0, 7.0, 5.0, 4.0, 0.0, 1.0, 2.0], "bins": [-17.953125, -17.4013671875, -16.849609375, -16.2978515625, -15.74609375, -15.1943359375, -14.642578125, -14.0908203125, -13.5390625, -12.9873046875, -12.435546875, -11.8837890625, -11.33203125, -10.7802734375, -10.228515625, -9.6767578125, -9.125, -8.5732421875, -8.021484375, -7.4697265625, -6.91796875, -6.3662109375, -5.814453125, -5.2626953125, -4.7109375, -4.1591796875, -3.607421875, -3.0556640625, -2.50390625, -1.9521484375, -1.400390625, -0.8486328125, -0.296875, 0.2548828125, 0.806640625, 1.3583984375, 1.91015625, 2.4619140625, 3.013671875, 3.5654296875, 4.1171875, 4.6689453125, 5.220703125, 5.7724609375, 6.32421875, 6.8759765625, 7.427734375, 7.9794921875, 8.53125, 9.0830078125, 9.634765625, 10.1865234375, 10.73828125, 11.2900390625, 11.841796875, 12.3935546875, 12.9453125, 13.4970703125, 14.048828125, 14.6005859375, 15.15234375, 15.7041015625, 16.255859375, 16.8076171875, 17.359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 11.0, 4.0, 12.0, 18.0, 22.0, 18.0, 24.0, 35.0, 36.0, 31.0, 38.0, 39.0, 38.0, 47.0, 41.0, 36.0, 56.0, 44.0, 41.0, 47.0, 33.0, 51.0, 37.0, 34.0, 32.0, 28.0, 27.0, 21.0, 18.0, 13.0, 9.0, 9.0, 8.0, 7.0, 7.0, 8.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.8963623046875, -9.573974609375, -9.2515869140625, -8.92919921875, -8.6068115234375, -8.284423828125, -7.9620361328125, -7.6396484375, -7.3172607421875, -6.994873046875, -6.6724853515625, -6.35009765625, -6.0277099609375, -5.705322265625, -5.3829345703125, -5.060546875, -4.7381591796875, -4.415771484375, -4.0933837890625, -3.77099609375, -3.4486083984375, -3.126220703125, -2.8038330078125, -2.4814453125, -2.1590576171875, -1.836669921875, -1.5142822265625, -1.19189453125, -0.8695068359375, -0.547119140625, -0.2247314453125, 0.09765625, 0.4200439453125, 0.742431640625, 1.0648193359375, 1.38720703125, 1.7095947265625, 2.031982421875, 2.3543701171875, 2.6767578125, 2.9991455078125, 3.321533203125, 3.6439208984375, 3.96630859375, 4.2886962890625, 4.611083984375, 4.9334716796875, 5.255859375, 5.5782470703125, 5.900634765625, 6.2230224609375, 6.54541015625, 6.8677978515625, 7.190185546875, 7.5125732421875, 7.8349609375, 8.1573486328125, 8.479736328125, 8.8021240234375, 9.12451171875, 9.4468994140625, 9.769287109375, 10.0916748046875, 10.4140625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 2.0, 12.0, 6.0, 11.0, 14.0, 16.0, 17.0, 24.0, 17.0, 21.0, 22.0, 29.0, 26.0, 27.0, 29.0, 33.0, 36.0, 51.0, 37.0, 33.0, 45.0, 40.0, 43.0, 39.0, 36.0, 42.0, 36.0, 36.0, 28.0, 23.0, 15.0, 19.0, 18.0, 12.0, 12.0, 19.0, 10.0, 9.0, 11.0, 10.0, 2.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-73.91032409667969, -71.82327270507812, -69.73622131347656, -67.64917755126953, -65.56212615966797, -63.475074768066406, -61.38802719116211, -59.30097961425781, -57.21392822265625, -55.12687683105469, -53.03982925415039, -50.952781677246094, -48.86573028564453, -46.77867889404297, -44.69163131713867, -42.604583740234375, -40.51753234863281, -38.43048095703125, -36.34343338012695, -34.256385803222656, -32.169334411621094, -30.082284927368164, -27.995235443115234, -25.908185958862305, -23.821136474609375, -21.734086990356445, -19.647037506103516, -17.559988021850586, -15.472938537597656, -13.385889053344727, -11.298839569091797, -9.211790084838867, -7.124744415283203, -5.037694931030273, -2.9506454467773438, -0.8635959625244141, 1.2234535217285156, 3.3105030059814453, 5.397552490234375, 7.484601974487305, 9.571651458740234, 11.658700942993164, 13.745750427246094, 15.832799911499023, 17.919849395751953, 20.006898880004883, 22.093948364257812, 24.180997848510742, 26.268047332763672, 28.3550968170166, 30.44214630126953, 32.529197692871094, 34.61624526977539, 36.70329284667969, 38.79034423828125, 40.87739562988281, 42.96444320678711, 45.051490783691406, 47.13854217529297, 49.22559356689453, 51.31264114379883, 53.399688720703125, 55.48674011230469, 57.57379150390625, 59.66083908081055]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 5.0, 2.0, 9.0, 4.0, 15.0, 9.0, 13.0, 21.0, 20.0, 16.0, 19.0, 27.0, 32.0, 30.0, 32.0, 31.0, 45.0, 42.0, 39.0, 36.0, 51.0, 45.0, 48.0, 36.0, 47.0, 42.0, 53.0, 36.0, 23.0, 24.0, 16.0, 13.0, 10.0, 21.0, 16.0, 12.0, 9.0, 9.0, 4.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-97.46207427978516, -94.4552993774414, -91.44853210449219, -88.44175720214844, -85.43498229980469, -82.42821502685547, -79.42144012451172, -76.4146728515625, -73.40789794921875, -70.401123046875, -67.39435577392578, -64.38758087158203, -61.38080978393555, -58.37403869628906, -55.36726379394531, -52.36049270629883, -49.353721618652344, -46.34695053100586, -43.340179443359375, -40.333404541015625, -37.32663345336914, -34.319862365722656, -31.31308937072754, -28.306316375732422, -25.299545288085938, -22.292774200439453, -19.286001205444336, -16.27922821044922, -13.272457122802734, -10.265685081481934, -7.258913040161133, -4.252140045166016, -1.245361328125, 1.7614107131958008, 4.768182754516602, 7.774954795837402, 10.781726837158203, 13.788498878479004, 16.795270919799805, 19.802043914794922, 22.808815002441406, 25.81558609008789, 28.822359085083008, 31.829132080078125, 34.83590316772461, 37.842674255371094, 40.849449157714844, 43.85622024536133, 46.86299133300781, 49.8697624206543, 52.87653350830078, 55.88330841064453, 58.890079498291016, 61.8968505859375, 64.90362548828125, 67.910400390625, 70.91716766357422, 73.92394256591797, 76.93070983886719, 79.93748474121094, 82.94425964355469, 85.9510269165039, 88.95780181884766, 91.96456909179688, 94.97134399414062]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 1.0, 5.0, 9.0, 8.0, 12.0, 18.0, 30.0, 46.0, 45.0, 61.0, 86.0, 133.0, 173.0, 212.0, 318.0, 467.0, 525.0, 647.0, 858.0, 1179.0, 1432.0, 1762.0, 2116.0, 2523.0, 2869.0, 3354.0, 1009523.0, 4180.0, 3228.0, 2842.0, 2398.0, 1986.0, 1670.0, 1310.0, 1052.0, 854.0, 652.0, 509.0, 365.0, 290.0, 251.0, 180.0, 122.0, 89.0, 62.0, 44.0, 26.0, 19.0, 23.0, 15.0, 7.0, 6.0, 6.0, 2.0, 8.0, 3.0], "bins": [-596.8502197265625, -579.7380981445312, -562.6259155273438, -545.5137939453125, -528.4016723632812, -511.2895202636719, -494.1773681640625, -477.06524658203125, -459.9530944824219, -442.8409423828125, -425.72882080078125, -408.6166687011719, -391.5045166015625, -374.39239501953125, -357.2802429199219, -340.1680908203125, -323.05596923828125, -305.9438171386719, -288.8316955566406, -271.71954345703125, -254.60740661621094, -237.49526977539062, -220.38311767578125, -203.27098083496094, -186.15884399414062, -169.0467071533203, -151.9345703125, -134.82241821289062, -117.71028137207031, -100.59814453125, -83.48600006103516, -66.37385559082031, -49.261688232421875, -32.1495475769043, -15.037406921386719, 2.0747337341308594, 19.186874389648438, 36.29901123046875, 53.411155700683594, 70.52330017089844, 87.63543701171875, 104.74757385253906, 121.8597183227539, 138.97186279296875, 156.08399963378906, 173.19613647460938, 190.30828857421875, 207.42042541503906, 224.53256225585938, 241.6446990966797, 258.7568359375, 275.8689880371094, 292.98114013671875, 310.09326171875, 327.2054138183594, 344.31756591796875, 361.4296875, 378.5418395996094, 395.6539611816406, 412.76611328125, 429.87823486328125, 446.9903869628906, 464.1025390625, 481.21466064453125, 498.3268127441406]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 13.0, 16.0, 18.0, 32.0, 47.0, 70.0, 116.0, 170.0, 250.0, 357.0, 509.0, 735.0, 1129.0, 1613.0, 2294.0, 3526.0, 5220.0, 8417.0, 15285.0, 33200.0, 51317824.0, 37883.0, 16696.0, 8907.0, 5475.0, 3691.0, 2394.0, 1714.0, 1191.0, 830.0, 555.0, 411.0, 232.0, 171.0, 119.0, 66.0, 60.0, 37.0, 28.0, 13.0, 9.0, 10.0, 8.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-682.1965942382812, -659.1227416992188, -636.0489501953125, -612.97509765625, -589.9012451171875, -566.8274536132812, -543.7536010742188, -520.6798095703125, -497.60595703125, -474.5321350097656, -451.4582824707031, -428.38446044921875, -405.3106384277344, -382.23681640625, -359.1629638671875, -336.0891418457031, -313.0152893066406, -289.94146728515625, -266.86761474609375, -243.79379272460938, -220.719970703125, -197.64613342285156, -174.57229614257812, -151.49847412109375, -128.4246368408203, -105.3508071899414, -82.2769775390625, -59.20314025878906, -36.129310607910156, -13.05548095703125, 10.018356323242188, 33.09217834472656, 56.166015625, 79.2398452758789, 102.31367492675781, 125.38751220703125, 148.46133422851562, 171.53517150878906, 194.6090087890625, 217.68283081054688, 240.7566680908203, 263.83050537109375, 286.9043273925781, 309.9781494140625, 333.052001953125, 356.1258239746094, 379.19964599609375, 402.27349853515625, 425.3473205566406, 448.421142578125, 471.4949951171875, 494.5688171386719, 517.6426391601562, 540.7164916992188, 563.790283203125, 586.8641357421875, 609.93798828125, 633.0118408203125, 656.0856323242188, 679.1594848632812, 702.2333374023438, 725.30712890625, 748.3809814453125, 771.454833984375, 794.5286254882812]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 5.0, 12.0, 11.0, 12.0, 9.0, 21.0, 29.0, 28.0, 45.0, 47.0, 64.0, 63.0, 89.0, 82.0, 74.0, 84.0, 62.0, 47.0, 51.0, 34.0, 29.0, 23.0, 17.0, 14.0, 11.0, 9.0, 6.0, 4.0, 6.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-522.4603271484375, -500.36871337890625, -478.277099609375, -456.18548583984375, -434.0938720703125, -412.00225830078125, -389.9106140136719, -367.8190002441406, -345.7273864746094, -323.6357727050781, -301.5441589355469, -279.4525146484375, -257.36090087890625, -235.26930236816406, -213.17767333984375, -191.0860595703125, -168.99444580078125, -146.90283203125, -124.81121063232422, -102.71958923339844, -80.62797546386719, -58.53636169433594, -36.444732666015625, -14.353118896484375, 7.738494873046875, 29.83011245727539, 51.921730041503906, 74.01335144042969, 96.10496520996094, 118.19657897949219, 140.2882080078125, 162.37982177734375, 184.471435546875, 206.56304931640625, 228.6546630859375, 250.7462921142578, 272.837890625, 294.92950439453125, 317.0211486816406, 339.1127624511719, 361.2043762207031, 383.2959899902344, 405.3876037597656, 427.479248046875, 449.57086181640625, 471.6624755859375, 493.75408935546875, 515.845703125, 537.9373168945312, 560.0289306640625, 582.1205444335938, 604.212158203125, 626.3037719726562, 648.3953857421875, 670.487060546875, 692.57861328125, 714.6702880859375, 736.7619018554688, 758.853515625, 780.9451293945312, 803.0367431640625, 825.1283569335938, 847.219970703125, 869.3116455078125, 891.4031982421875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 6.0, 10.0, 15.0, 13.0, 17.0, 23.0, 23.0, 30.0, 24.0, 31.0, 36.0, 47.0, 29.0, 55.0, 64.0, 65.0, 56.0, 51.0, 53.0, 43.0, 38.0, 45.0, 32.0, 23.0, 29.0, 15.0, 15.0, 13.0, 19.0, 11.0, 11.0, 4.0, 9.0, 5.0, 13.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-685.2730712890625, -664.1161499023438, -642.959228515625, -621.80224609375, -600.6453247070312, -579.4884033203125, -558.3314208984375, -537.1744995117188, -516.017578125, -494.86065673828125, -473.7037048339844, -452.5467529296875, -431.38983154296875, -410.23291015625, -389.0759582519531, -367.91900634765625, -346.7620849609375, -325.60516357421875, -304.4482116699219, -283.291259765625, -262.13433837890625, -240.97740173339844, -219.82046508789062, -198.6635284423828, -177.506591796875, -156.3496551513672, -135.19271850585938, -114.03578186035156, -92.87884521484375, -71.72190856933594, -50.564971923828125, -29.408035278320312, -8.25115966796875, 12.905776977539062, 34.062713623046875, 55.21965026855469, 76.3765869140625, 97.53352355957031, 118.69046020507812, 139.84739685058594, 161.00433349609375, 182.16127014160156, 203.31820678710938, 224.4751434326172, 245.632080078125, 266.78900146484375, 287.9459533691406, 309.1029052734375, 330.25982666015625, 351.416748046875, 372.5736999511719, 393.73065185546875, 414.8875732421875, 436.04449462890625, 457.2014465332031, 478.3583984375, 499.51531982421875, 520.6722412109375, 541.8292236328125, 562.9861450195312, 584.14306640625, 605.2999877929688, 626.4569091796875, 647.6138916015625, 668.7708129882812]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 3.0, 6.0, 10.0, 9.0, 19.0, 15.0, 26.0, 43.0, 34.0, 71.0, 132.0, 210.0, 231.0, 366.0, 487.0, 806.0, 1212.0, 1887.0, 2929.0, 4771.0, 8133.0, 14753.0, 30545.0, 72491.0, 218260.0, 1744524.0, 1740637.0, 212032.0, 71431.0, 30100.0, 14913.0, 8406.0, 5041.0, 3223.0, 2068.0, 1383.0, 963.0, 647.0, 433.0, 319.0, 237.0, 139.0, 97.0, 81.0, 54.0, 38.0, 21.0, 16.0, 16.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.953125, -21.26708984375, -20.5810546875, -19.89501953125, -19.208984375, -18.52294921875, -17.8369140625, -17.15087890625, -16.46484375, -15.77880859375, -15.0927734375, -14.40673828125, -13.720703125, -13.03466796875, -12.3486328125, -11.66259765625, -10.9765625, -10.29052734375, -9.6044921875, -8.91845703125, -8.232421875, -7.54638671875, -6.8603515625, -6.17431640625, -5.48828125, -4.80224609375, -4.1162109375, -3.43017578125, -2.744140625, -2.05810546875, -1.3720703125, -0.68603515625, 0.0, 0.68603515625, 1.3720703125, 2.05810546875, 2.744140625, 3.43017578125, 4.1162109375, 4.80224609375, 5.48828125, 6.17431640625, 6.8603515625, 7.54638671875, 8.232421875, 8.91845703125, 9.6044921875, 10.29052734375, 10.9765625, 11.66259765625, 12.3486328125, 13.03466796875, 13.720703125, 14.40673828125, 15.0927734375, 15.77880859375, 16.46484375, 17.15087890625, 17.8369140625, 18.52294921875, 19.208984375, 19.89501953125, 20.5810546875, 21.26708984375, 21.953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 8.0, 15.0, 26.0, 28.0, 45.0, 56.0, 71.0, 89.0, 106.0, 103.0, 92.0, 97.0, 49.0, 49.0, 35.0, 29.0, 18.0, 12.0, 8.0, 5.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.27099609375, -2.1962890625, -2.12158203125, -2.046875, -1.97216796875, -1.8974609375, -1.82275390625, -1.748046875, -1.67333984375, -1.5986328125, -1.52392578125, -1.44921875, -1.37451171875, -1.2998046875, -1.22509765625, -1.150390625, -1.07568359375, -1.0009765625, -0.92626953125, -0.8515625, -0.77685546875, -0.7021484375, -0.62744140625, -0.552734375, -0.47802734375, -0.4033203125, -0.32861328125, -0.25390625, -0.17919921875, -0.1044921875, -0.02978515625, 0.044921875, 0.11962890625, 0.1943359375, 0.26904296875, 0.34375, 0.41845703125, 0.4931640625, 0.56787109375, 0.642578125, 0.71728515625, 0.7919921875, 0.86669921875, 0.94140625, 1.01611328125, 1.0908203125, 1.16552734375, 1.240234375, 1.31494140625, 1.3896484375, 1.46435546875, 1.5390625, 1.61376953125, 1.6884765625, 1.76318359375, 1.837890625, 1.91259765625, 1.9873046875, 2.06201171875, 2.13671875, 2.21142578125, 2.2861328125, 2.36083984375, 2.435546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 7.0, 9.0, 19.0, 13.0, 19.0, 39.0, 47.0, 79.0, 96.0, 165.0, 213.0, 408.0, 640.0, 1160.0, 2180.0, 4869.0, 11423.0, 29105.0, 87300.0, 318323.0, 2193349.0, 1185279.0, 245429.0, 71245.0, 24468.0, 9447.0, 4216.0, 2025.0, 1028.0, 602.0, 369.0, 228.0, 137.0, 103.0, 54.0, 52.0, 36.0, 28.0, 12.0, 19.0, 14.0, 2.0, 4.0, 2.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.7119140625, -18.064453125, -17.4169921875, -16.76953125, -16.1220703125, -15.474609375, -14.8271484375, -14.1796875, -13.5322265625, -12.884765625, -12.2373046875, -11.58984375, -10.9423828125, -10.294921875, -9.6474609375, -9.0, -8.3525390625, -7.705078125, -7.0576171875, -6.41015625, -5.7626953125, -5.115234375, -4.4677734375, -3.8203125, -3.1728515625, -2.525390625, -1.8779296875, -1.23046875, -0.5830078125, 0.064453125, 0.7119140625, 1.359375, 2.0068359375, 2.654296875, 3.3017578125, 3.94921875, 4.5966796875, 5.244140625, 5.8916015625, 6.5390625, 7.1865234375, 7.833984375, 8.4814453125, 9.12890625, 9.7763671875, 10.423828125, 11.0712890625, 11.71875, 12.3662109375, 13.013671875, 13.6611328125, 14.30859375, 14.9560546875, 15.603515625, 16.2509765625, 16.8984375, 17.5458984375, 18.193359375, 18.8408203125, 19.48828125, 20.1357421875, 20.783203125, 21.4306640625, 22.078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 4.0, 7.0, 11.0, 12.0, 11.0, 21.0, 19.0, 38.0, 29.0, 47.0, 47.0, 53.0, 92.0, 109.0, 143.0, 186.0, 240.0, 334.0, 910.0, 463.0, 286.0, 211.0, 164.0, 132.0, 92.0, 92.0, 79.0, 44.0, 42.0, 33.0, 29.0, 19.0, 22.0, 14.0, 7.0, 10.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4765625, -5.2979736328125, -5.119384765625, -4.9407958984375, -4.76220703125, -4.5836181640625, -4.405029296875, -4.2264404296875, -4.0478515625, -3.8692626953125, -3.690673828125, -3.5120849609375, -3.33349609375, -3.1549072265625, -2.976318359375, -2.7977294921875, -2.619140625, -2.4405517578125, -2.261962890625, -2.0833740234375, -1.90478515625, -1.7261962890625, -1.547607421875, -1.3690185546875, -1.1904296875, -1.0118408203125, -0.833251953125, -0.6546630859375, -0.47607421875, -0.2974853515625, -0.118896484375, 0.0596923828125, 0.23828125, 0.4168701171875, 0.595458984375, 0.7740478515625, 0.95263671875, 1.1312255859375, 1.309814453125, 1.4884033203125, 1.6669921875, 1.8455810546875, 2.024169921875, 2.2027587890625, 2.38134765625, 2.5599365234375, 2.738525390625, 2.9171142578125, 3.095703125, 3.2742919921875, 3.452880859375, 3.6314697265625, 3.81005859375, 3.9886474609375, 4.167236328125, 4.3458251953125, 4.5244140625, 4.7030029296875, 4.881591796875, 5.0601806640625, 5.23876953125, 5.4173583984375, 5.595947265625, 5.7745361328125, 5.953125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 13.0, 14.0, 19.0, 25.0, 42.0, 74.0, 91.0, 97.0, 95.0, 106.0, 107.0, 76.0, 64.0, 48.0, 24.0, 31.0, 17.0, 18.0, 10.0, 3.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.60264587402344, -37.04033279418945, -35.4780158996582, -33.91570281982422, -32.35338592529297, -30.791072845458984, -29.228757858276367, -27.66644287109375, -26.104129791259766, -24.54181480407715, -22.97949981689453, -21.417186737060547, -19.85487174987793, -18.292556762695312, -16.730241775512695, -15.167927742004395, -13.605611801147461, -12.043296813964844, -10.480982780456543, -8.918667793273926, -7.356353282928467, -5.794038772583008, -4.231723785400391, -2.66940975189209, -1.1070947647094727, 0.4552198648452759, 2.0175344944000244, 3.5798492431640625, 5.1421637535095215, 6.7044782638549805, 8.266793251037598, 9.829107284545898, 11.391422271728516, 12.953737258911133, 14.516051292419434, 16.078365325927734, 17.64068031311035, 19.20299530029297, 20.765310287475586, 22.327625274658203, 23.889938354492188, 25.452253341674805, 27.014568328857422, 28.576881408691406, 30.139196395874023, 31.70151138305664, 33.263824462890625, 34.826141357421875, 36.388458251953125, 37.95077133178711, 39.51308822631836, 41.075401306152344, 42.637718200683594, 44.20003128051758, 45.76234436035156, 47.32466125488281, 48.8869743347168, 50.44928741455078, 52.01160430908203, 53.573917388916016, 55.136234283447266, 56.69854736328125, 58.2608642578125, 59.823177337646484, 61.38549041748047]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 7.0, 8.0, 11.0, 18.0, 23.0, 26.0, 20.0, 24.0, 23.0, 27.0, 36.0, 37.0, 40.0, 48.0, 30.0, 43.0, 45.0, 41.0, 43.0, 41.0, 36.0, 53.0, 48.0, 41.0, 25.0, 31.0, 31.0, 18.0, 15.0, 15.0, 17.0, 11.0, 9.0, 10.0, 9.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.839374542236328, -27.942052841186523, -27.04473114013672, -26.147411346435547, -25.250089645385742, -24.352767944335938, -23.455446243286133, -22.558124542236328, -21.660802841186523, -20.76348114013672, -19.866159439086914, -18.96883773803711, -18.071517944335938, -17.174196243286133, -16.276874542236328, -15.379552841186523, -14.482232093811035, -13.58491039276123, -12.687589645385742, -11.790267944335938, -10.892946243286133, -9.995624542236328, -9.09830379486084, -8.200982093811035, -7.303660869598389, -6.406339645385742, -5.5090179443359375, -4.611696720123291, -3.7143752574920654, -2.81705379486084, -1.9197325706481934, -1.0224108695983887, -0.1250896453857422, 0.7722317576408386, 1.6695531606674194, 2.5668745040893555, 3.464195966720581, 4.361517429351807, 5.258838653564453, 6.156160354614258, 7.053481578826904, 7.950802803039551, 8.848124504089355, 9.745445251464844, 10.642766952514648, 11.540088653564453, 12.437410354614258, 13.334732055664062, 14.23205280303955, 15.129374504089355, 16.026695251464844, 16.92401695251465, 17.821338653564453, 18.718660354614258, 19.615982055664062, 20.513301849365234, 21.41062355041504, 22.307945251464844, 23.20526695251465, 24.102588653564453, 24.999908447265625, 25.89723014831543, 26.794551849365234, 27.69187355041504, 28.589195251464844]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 14.0, 3.0, 13.0, 14.0, 21.0, 21.0, 37.0, 48.0, 74.0, 128.0, 167.0, 282.0, 450.0, 691.0, 1154.0, 2068.0, 3930.0, 8130.0, 19257.0, 51896.0, 172421.0, 447539.0, 229764.0, 66582.0, 23472.0, 9842.0, 4600.0, 2316.0, 1429.0, 795.0, 502.0, 283.0, 210.0, 129.0, 85.0, 69.0, 37.0, 27.0, 23.0, 8.0, 8.0, 6.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-28.296875, -27.42919921875, -26.5615234375, -25.69384765625, -24.826171875, -23.95849609375, -23.0908203125, -22.22314453125, -21.35546875, -20.48779296875, -19.6201171875, -18.75244140625, -17.884765625, -17.01708984375, -16.1494140625, -15.28173828125, -14.4140625, -13.54638671875, -12.6787109375, -11.81103515625, -10.943359375, -10.07568359375, -9.2080078125, -8.34033203125, -7.47265625, -6.60498046875, -5.7373046875, -4.86962890625, -4.001953125, -3.13427734375, -2.2666015625, -1.39892578125, -0.53125, 0.33642578125, 1.2041015625, 2.07177734375, 2.939453125, 3.80712890625, 4.6748046875, 5.54248046875, 6.41015625, 7.27783203125, 8.1455078125, 9.01318359375, 9.880859375, 10.74853515625, 11.6162109375, 12.48388671875, 13.3515625, 14.21923828125, 15.0869140625, 15.95458984375, 16.822265625, 17.68994140625, 18.5576171875, 19.42529296875, 20.29296875, 21.16064453125, 22.0283203125, 22.89599609375, 23.763671875, 24.63134765625, 25.4990234375, 26.36669921875, 27.234375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 13.0, 15.0, 14.0, 24.0, 27.0, 40.0, 58.0, 72.0, 74.0, 93.0, 94.0, 90.0, 85.0, 59.0, 53.0, 33.0, 29.0, 24.0, 22.0, 17.0, 10.0, 3.0, 10.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.691131591796875, -2.60882568359375, -2.526519775390625, -2.4442138671875, -2.361907958984375, -2.27960205078125, -2.197296142578125, -2.114990234375, -2.032684326171875, -1.95037841796875, -1.868072509765625, -1.7857666015625, -1.703460693359375, -1.62115478515625, -1.538848876953125, -1.45654296875, -1.374237060546875, -1.29193115234375, -1.209625244140625, -1.1273193359375, -1.045013427734375, -0.96270751953125, -0.880401611328125, -0.798095703125, -0.715789794921875, -0.63348388671875, -0.551177978515625, -0.4688720703125, -0.386566162109375, -0.30426025390625, -0.221954345703125, -0.1396484375, -0.057342529296875, 0.02496337890625, 0.107269287109375, 0.1895751953125, 0.271881103515625, 0.35418701171875, 0.436492919921875, 0.518798828125, 0.601104736328125, 0.68341064453125, 0.765716552734375, 0.8480224609375, 0.930328369140625, 1.01263427734375, 1.094940185546875, 1.17724609375, 1.259552001953125, 1.34185791015625, 1.424163818359375, 1.5064697265625, 1.588775634765625, 1.67108154296875, 1.753387451171875, 1.835693359375, 1.917999267578125, 2.00030517578125, 2.082611083984375, 2.1649169921875, 2.247222900390625, 2.32952880859375, 2.411834716796875, 2.494140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 5.0, 19.0, 23.0, 43.0, 65.0, 110.0, 171.0, 324.0, 553.0, 1061.0, 1866.0, 3534.0, 7058.0, 15404.0, 45879.0, 257878.0, 564194.0, 103980.0, 25249.0, 10286.0, 4982.0, 2546.0, 1390.0, 818.0, 465.0, 253.0, 134.0, 75.0, 54.0, 36.0, 30.0, 14.0, 9.0, 9.0, 7.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.296875, -29.295654296875, -28.29443359375, -27.293212890625, -26.2919921875, -25.290771484375, -24.28955078125, -23.288330078125, -22.287109375, -21.285888671875, -20.28466796875, -19.283447265625, -18.2822265625, -17.281005859375, -16.27978515625, -15.278564453125, -14.27734375, -13.276123046875, -12.27490234375, -11.273681640625, -10.2724609375, -9.271240234375, -8.27001953125, -7.268798828125, -6.267578125, -5.266357421875, -4.26513671875, -3.263916015625, -2.2626953125, -1.261474609375, -0.26025390625, 0.740966796875, 1.7421875, 2.743408203125, 3.74462890625, 4.745849609375, 5.7470703125, 6.748291015625, 7.74951171875, 8.750732421875, 9.751953125, 10.753173828125, 11.75439453125, 12.755615234375, 13.7568359375, 14.758056640625, 15.75927734375, 16.760498046875, 17.76171875, 18.762939453125, 19.76416015625, 20.765380859375, 21.7666015625, 22.767822265625, 23.76904296875, 24.770263671875, 25.771484375, 26.772705078125, 27.77392578125, 28.775146484375, 29.7763671875, 30.777587890625, 31.77880859375, 32.780029296875, 33.78125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 6.0, 5.0, 9.0, 16.0, 14.0, 16.0, 16.0, 23.0, 25.0, 41.0, 36.0, 32.0, 43.0, 36.0, 42.0, 49.0, 60.0, 50.0, 28.0, 45.0, 33.0, 48.0, 46.0, 55.0, 32.0, 27.0, 27.0, 30.0, 13.0, 16.0, 14.0, 7.0, 11.0, 7.0, 10.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.2578125, -14.7589111328125, -14.260009765625, -13.7611083984375, -13.26220703125, -12.7633056640625, -12.264404296875, -11.7655029296875, -11.2666015625, -10.7677001953125, -10.268798828125, -9.7698974609375, -9.27099609375, -8.7720947265625, -8.273193359375, -7.7742919921875, -7.275390625, -6.7764892578125, -6.277587890625, -5.7786865234375, -5.27978515625, -4.7808837890625, -4.281982421875, -3.7830810546875, -3.2841796875, -2.7852783203125, -2.286376953125, -1.7874755859375, -1.28857421875, -0.7896728515625, -0.290771484375, 0.2081298828125, 0.70703125, 1.2059326171875, 1.704833984375, 2.2037353515625, 2.70263671875, 3.2015380859375, 3.700439453125, 4.1993408203125, 4.6982421875, 5.1971435546875, 5.696044921875, 6.1949462890625, 6.69384765625, 7.1927490234375, 7.691650390625, 8.1905517578125, 8.689453125, 9.1883544921875, 9.687255859375, 10.1861572265625, 10.68505859375, 11.1839599609375, 11.682861328125, 12.1817626953125, 12.6806640625, 13.1795654296875, 13.678466796875, 14.1773681640625, 14.67626953125, 15.1751708984375, 15.674072265625, 16.1729736328125, 16.671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 12.0, 13.0, 17.0, 33.0, 27.0, 66.0, 81.0, 172.0, 258.0, 482.0, 1001.0, 2461.0, 8422.0, 48094.0, 822744.0, 143427.0, 14410.0, 3862.0, 1460.0, 621.0, 337.0, 205.0, 119.0, 60.0, 38.0, 22.0, 25.0, 16.0, 13.0, 7.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0], "bins": [-72.9375, -70.8349609375, -68.732421875, -66.6298828125, -64.52734375, -62.4248046875, -60.322265625, -58.2197265625, -56.1171875, -54.0146484375, -51.912109375, -49.8095703125, -47.70703125, -45.6044921875, -43.501953125, -41.3994140625, -39.296875, -37.1943359375, -35.091796875, -32.9892578125, -30.88671875, -28.7841796875, -26.681640625, -24.5791015625, -22.4765625, -20.3740234375, -18.271484375, -16.1689453125, -14.06640625, -11.9638671875, -9.861328125, -7.7587890625, -5.65625, -3.5537109375, -1.451171875, 0.6513671875, 2.75390625, 4.8564453125, 6.958984375, 9.0615234375, 11.1640625, 13.2666015625, 15.369140625, 17.4716796875, 19.57421875, 21.6767578125, 23.779296875, 25.8818359375, 27.984375, 30.0869140625, 32.189453125, 34.2919921875, 36.39453125, 38.4970703125, 40.599609375, 42.7021484375, 44.8046875, 46.9072265625, 49.009765625, 51.1123046875, 53.21484375, 55.3173828125, 57.419921875, 59.5224609375, 61.625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 11.0, 14.0, 9.0, 13.0, 16.0, 32.0, 58.0, 69.0, 135.0, 192.0, 153.0, 115.0, 65.0, 41.0, 26.0, 18.0, 6.0, 8.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00525665283203125, -0.005105137825012207, -0.004953622817993164, -0.004802107810974121, -0.004650592803955078, -0.004499077796936035, -0.004347562789916992, -0.004196047782897949, -0.004044532775878906, -0.0038930177688598633, -0.0037415027618408203, -0.0035899877548217773, -0.0034384727478027344, -0.0032869577407836914, -0.0031354427337646484, -0.0029839277267456055, -0.0028324127197265625, -0.0026808977127075195, -0.0025293827056884766, -0.0023778676986694336, -0.0022263526916503906, -0.0020748376846313477, -0.0019233226776123047, -0.0017718076705932617, -0.0016202926635742188, -0.0014687776565551758, -0.0013172626495361328, -0.0011657476425170898, -0.0010142326354980469, -0.0008627176284790039, -0.0007112026214599609, -0.000559687614440918, -0.000408172607421875, -0.00025665760040283203, -0.00010514259338378906, 4.6372413635253906e-05, 0.00019788742065429688, 0.00034940242767333984, 0.0005009174346923828, 0.0006524324417114258, 0.0008039474487304688, 0.0009554624557495117, 0.0011069774627685547, 0.0012584924697875977, 0.0014100074768066406, 0.0015615224838256836, 0.0017130374908447266, 0.0018645524978637695, 0.0020160675048828125, 0.0021675825119018555, 0.0023190975189208984, 0.0024706125259399414, 0.0026221275329589844, 0.0027736425399780273, 0.0029251575469970703, 0.0030766725540161133, 0.0032281875610351562, 0.0033797025680541992, 0.003531217575073242, 0.003682732582092285, 0.003834247589111328, 0.003985762596130371, 0.004137277603149414, 0.004288792610168457, 0.0044403076171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 2.0, 20.0, 14.0, 29.0, 13.0, 51.0, 91.0, 182.0, 327.0, 820.0, 2665.0, 14653.0, 484495.0, 525744.0, 15086.0, 2786.0, 814.0, 351.0, 167.0, 88.0, 47.0, 36.0, 25.0, 14.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.15625, -59.93701171875, -57.7177734375, -55.49853515625, -53.279296875, -51.06005859375, -48.8408203125, -46.62158203125, -44.40234375, -42.18310546875, -39.9638671875, -37.74462890625, -35.525390625, -33.30615234375, -31.0869140625, -28.86767578125, -26.6484375, -24.42919921875, -22.2099609375, -19.99072265625, -17.771484375, -15.55224609375, -13.3330078125, -11.11376953125, -8.89453125, -6.67529296875, -4.4560546875, -2.23681640625, -0.017578125, 2.20166015625, 4.4208984375, 6.64013671875, 8.859375, 11.07861328125, 13.2978515625, 15.51708984375, 17.736328125, 19.95556640625, 22.1748046875, 24.39404296875, 26.61328125, 28.83251953125, 31.0517578125, 33.27099609375, 35.490234375, 37.70947265625, 39.9287109375, 42.14794921875, 44.3671875, 46.58642578125, 48.8056640625, 51.02490234375, 53.244140625, 55.46337890625, 57.6826171875, 59.90185546875, 62.12109375, 64.34033203125, 66.5595703125, 68.77880859375, 70.998046875, 73.21728515625, 75.4365234375, 77.65576171875, 79.875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 16.0, 16.0, 39.0, 85.0, 148.0, 195.0, 207.0, 145.0, 75.0, 28.0, 18.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.3125, -31.1923828125, -30.072265625, -28.9521484375, -27.83203125, -26.7119140625, -25.591796875, -24.4716796875, -23.3515625, -22.2314453125, -21.111328125, -19.9912109375, -18.87109375, -17.7509765625, -16.630859375, -15.5107421875, -14.390625, -13.2705078125, -12.150390625, -11.0302734375, -9.91015625, -8.7900390625, -7.669921875, -6.5498046875, -5.4296875, -4.3095703125, -3.189453125, -2.0693359375, -0.94921875, 0.1708984375, 1.291015625, 2.4111328125, 3.53125, 4.6513671875, 5.771484375, 6.8916015625, 8.01171875, 9.1318359375, 10.251953125, 11.3720703125, 12.4921875, 13.6123046875, 14.732421875, 15.8525390625, 16.97265625, 18.0927734375, 19.212890625, 20.3330078125, 21.453125, 22.5732421875, 23.693359375, 24.8134765625, 25.93359375, 27.0537109375, 28.173828125, 29.2939453125, 30.4140625, 31.5341796875, 32.654296875, 33.7744140625, 34.89453125, 36.0146484375, 37.134765625, 38.2548828125, 39.375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 5.0, 4.0, 7.0, 11.0, 13.0, 35.0, 55.0, 103.0, 223.0, 246.0, 149.0, 59.0, 20.0, 17.0, 8.0, 12.0, 3.0, 7.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-394.4444274902344, -383.82470703125, -373.2049560546875, -362.5852355957031, -351.9654846191406, -341.34576416015625, -330.72601318359375, -320.1062927246094, -309.486572265625, -298.8668518066406, -288.2471008300781, -277.62738037109375, -267.00762939453125, -256.3879089355469, -245.76817321777344, -235.1484375, -224.52870178222656, -213.90896606445312, -203.2892303466797, -192.66949462890625, -182.04977416992188, -171.43003845214844, -160.810302734375, -150.19058227539062, -139.57083129882812, -128.9510955810547, -118.33136749267578, -107.71163177490234, -97.09190368652344, -86.47216796875, -75.85243225097656, -65.23270416259766, -54.61297607421875, -43.99324417114258, -33.373512268066406, -22.75377655029297, -12.134044647216797, -1.514312744140625, 9.105422973632812, 19.72515106201172, 30.344886779785156, 40.96461868286133, 51.5843505859375, 62.20408630371094, 72.82382202148438, 83.44355010986328, 94.06328582763672, 104.68301391601562, 115.30274963378906, 125.9224853515625, 136.54222106933594, 147.16195678710938, 157.78167724609375, 168.4014129638672, 179.02114868164062, 189.640869140625, 200.2606201171875, 210.88035583496094, 221.50009155273438, 232.11981201171875, 242.7395477294922, 253.35928344726562, 263.97900390625, 274.5987548828125, 285.2184753417969]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 8.0, 7.0, 5.0, 11.0, 9.0, 31.0, 35.0, 59.0, 104.0, 140.0, 171.0, 135.0, 91.0, 70.0, 35.0, 18.0, 11.0, 11.0, 6.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.5455627441406, -280.0285339355469, -270.511474609375, -260.99444580078125, -251.4774169921875, -241.96038818359375, -232.44334411621094, -222.92630004882812, -213.40927124023438, -203.89224243164062, -194.3751983642578, -184.858154296875, -175.34112548828125, -165.8240966796875, -156.3070526123047, -146.79000854492188, -137.27297973632812, -127.75594329833984, -118.23890686035156, -108.72187042236328, -99.204833984375, -89.68779754638672, -80.17076110839844, -70.65372467041016, -61.136688232421875, -51.619651794433594, -42.10261535644531, -32.58557891845703, -23.06854248046875, -13.551506042480469, -4.0344696044921875, 5.482566833496094, 14.999603271484375, 24.516639709472656, 34.03367614746094, 43.55071258544922, 53.0677490234375, 62.58478546142578, 72.10182189941406, 81.61885833740234, 91.13589477539062, 100.6529312133789, 110.16996765136719, 119.68700408935547, 129.20404052734375, 138.7210693359375, 148.2381134033203, 157.75515747070312, 167.27218627929688, 176.78921508789062, 186.30625915527344, 195.82330322265625, 205.34033203125, 214.85736083984375, 224.37440490722656, 233.89144897460938, 243.40847778320312, 252.92550659179688, 262.44256591796875, 271.9595947265625, 281.47662353515625, 290.99365234375, 300.51068115234375, 310.0277404785156, 319.5447692871094]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 12.0, 17.0, 16.0, 27.0, 29.0, 34.0, 58.0, 66.0, 117.0, 130.0, 231.0, 312.0, 571.0, 1040.0, 1726.0, 3427.0, 7012.0, 17711.0, 55880.0, 322847.0, 3562003.0, 164426.0, 35870.0, 11529.0, 4567.0, 2101.0, 1008.0, 593.0, 333.0, 220.0, 119.0, 76.0, 44.0, 38.0, 23.0, 24.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.4375, -67.1484375, -64.859375, -62.5703125, -60.28125, -57.9921875, -55.703125, -53.4140625, -51.125, -48.8359375, -46.546875, -44.2578125, -41.96875, -39.6796875, -37.390625, -35.1015625, -32.8125, -30.5234375, -28.234375, -25.9453125, -23.65625, -21.3671875, -19.078125, -16.7890625, -14.5, -12.2109375, -9.921875, -7.6328125, -5.34375, -3.0546875, -0.765625, 1.5234375, 3.8125, 6.1015625, 8.390625, 10.6796875, 12.96875, 15.2578125, 17.546875, 19.8359375, 22.125, 24.4140625, 26.703125, 28.9921875, 31.28125, 33.5703125, 35.859375, 38.1484375, 40.4375, 42.7265625, 45.015625, 47.3046875, 49.59375, 51.8828125, 54.171875, 56.4609375, 58.75, 61.0390625, 63.328125, 65.6171875, 67.90625, 70.1953125, 72.484375, 74.7734375, 77.0625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 4.0, 5.0, 3.0, 6.0, 7.0, 12.0, 23.0, 22.0, 28.0, 32.0, 59.0, 62.0, 69.0, 87.0, 91.0, 90.0, 68.0, 69.0, 56.0, 52.0, 38.0, 23.0, 18.0, 18.0, 8.0, 6.0, 15.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.32421875, -3.23309326171875, -3.1419677734375, -3.05084228515625, -2.959716796875, -2.86859130859375, -2.7774658203125, -2.68634033203125, -2.59521484375, -2.50408935546875, -2.4129638671875, -2.32183837890625, -2.230712890625, -2.13958740234375, -2.0484619140625, -1.95733642578125, -1.8662109375, -1.77508544921875, -1.6839599609375, -1.59283447265625, -1.501708984375, -1.41058349609375, -1.3194580078125, -1.22833251953125, -1.13720703125, -1.04608154296875, -0.9549560546875, -0.86383056640625, -0.772705078125, -0.68157958984375, -0.5904541015625, -0.49932861328125, -0.408203125, -0.31707763671875, -0.2259521484375, -0.13482666015625, -0.043701171875, 0.04742431640625, 0.1385498046875, 0.22967529296875, 0.32080078125, 0.41192626953125, 0.5030517578125, 0.59417724609375, 0.685302734375, 0.77642822265625, 0.8675537109375, 0.95867919921875, 1.0498046875, 1.14093017578125, 1.2320556640625, 1.32318115234375, 1.414306640625, 1.50543212890625, 1.5965576171875, 1.68768310546875, 1.77880859375, 1.86993408203125, 1.9610595703125, 2.05218505859375, 2.143310546875, 2.23443603515625, 2.3255615234375, 2.41668701171875, 2.5078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 10.0, 12.0, 17.0, 19.0, 44.0, 83.0, 184.0, 305.0, 738.0, 1849.0, 6324.0, 31292.0, 249216.0, 3414587.0, 429314.0, 47003.0, 9105.0, 2504.0, 845.0, 407.0, 178.0, 87.0, 57.0, 48.0, 20.0, 5.0, 11.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.9375, -46.7724609375, -44.607421875, -42.4423828125, -40.27734375, -38.1123046875, -35.947265625, -33.7822265625, -31.6171875, -29.4521484375, -27.287109375, -25.1220703125, -22.95703125, -20.7919921875, -18.626953125, -16.4619140625, -14.296875, -12.1318359375, -9.966796875, -7.8017578125, -5.63671875, -3.4716796875, -1.306640625, 0.8583984375, 3.0234375, 5.1884765625, 7.353515625, 9.5185546875, 11.68359375, 13.8486328125, 16.013671875, 18.1787109375, 20.34375, 22.5087890625, 24.673828125, 26.8388671875, 29.00390625, 31.1689453125, 33.333984375, 35.4990234375, 37.6640625, 39.8291015625, 41.994140625, 44.1591796875, 46.32421875, 48.4892578125, 50.654296875, 52.8193359375, 54.984375, 57.1494140625, 59.314453125, 61.4794921875, 63.64453125, 65.8095703125, 67.974609375, 70.1396484375, 72.3046875, 74.4697265625, 76.634765625, 78.7998046875, 80.96484375, 83.1298828125, 85.294921875, 87.4599609375, 89.625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 12.0, 10.0, 15.0, 21.0, 34.0, 27.0, 60.0, 72.0, 91.0, 169.0, 257.0, 342.0, 791.0, 977.0, 391.0, 211.0, 152.0, 110.0, 84.0, 67.0, 35.0, 27.0, 26.0, 26.0, 14.0, 12.0, 5.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.640625, -6.4266357421875, -6.212646484375, -5.9986572265625, -5.78466796875, -5.5706787109375, -5.356689453125, -5.1427001953125, -4.9287109375, -4.7147216796875, -4.500732421875, -4.2867431640625, -4.07275390625, -3.8587646484375, -3.644775390625, -3.4307861328125, -3.216796875, -3.0028076171875, -2.788818359375, -2.5748291015625, -2.36083984375, -2.1468505859375, -1.932861328125, -1.7188720703125, -1.5048828125, -1.2908935546875, -1.076904296875, -0.8629150390625, -0.64892578125, -0.4349365234375, -0.220947265625, -0.0069580078125, 0.20703125, 0.4210205078125, 0.635009765625, 0.8489990234375, 1.06298828125, 1.2769775390625, 1.490966796875, 1.7049560546875, 1.9189453125, 2.1329345703125, 2.346923828125, 2.5609130859375, 2.77490234375, 2.9888916015625, 3.202880859375, 3.4168701171875, 3.630859375, 3.8448486328125, 4.058837890625, 4.2728271484375, 4.48681640625, 4.7008056640625, 4.914794921875, 5.1287841796875, 5.3427734375, 5.5567626953125, 5.770751953125, 5.9847412109375, 6.19873046875, 6.4127197265625, 6.626708984375, 6.8406982421875, 7.0546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 3.0, 12.0, 11.0, 20.0, 42.0, 111.0, 139.0, 193.0, 199.0, 108.0, 82.0, 38.0, 13.0, 10.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-89.86197662353516, -87.64466857910156, -85.4273681640625, -83.2100601196289, -80.99275970458984, -78.77545166015625, -76.55815124511719, -74.3408432006836, -72.12353515625, -69.9062271118164, -67.68892669677734, -65.47161865234375, -63.25431823730469, -61.037010192871094, -58.819705963134766, -56.60240173339844, -54.385101318359375, -52.16779708862305, -49.95049285888672, -47.73318862915039, -45.51588439941406, -43.29857635498047, -41.08127212524414, -38.86396789550781, -36.646663665771484, -34.429359436035156, -32.21205520629883, -29.994749069213867, -27.77744483947754, -25.56014060974121, -23.34283447265625, -21.125530242919922, -18.90822982788086, -16.69092559814453, -14.473620414733887, -12.256315231323242, -10.039011001586914, -7.821706771850586, -5.604401588439941, -3.387096405029297, -1.1697921752929688, 1.0475125312805176, 3.264817237854004, 5.48212194442749, 7.699426651000977, 9.916730880737305, 12.13403606414795, 14.351341247558594, 16.568645477294922, 18.78594970703125, 21.003253936767578, 23.22056007385254, 25.437864303588867, 27.655168533325195, 29.872474670410156, 32.089778900146484, 34.30708312988281, 36.52438735961914, 38.74169158935547, 40.9589958190918, 43.176300048828125, 45.39360809326172, 47.61091232299805, 49.828216552734375, 52.0455207824707]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 14.0, 18.0, 21.0, 21.0, 35.0, 45.0, 52.0, 47.0, 63.0, 64.0, 70.0, 72.0, 71.0, 68.0, 52.0, 58.0, 39.0, 30.0, 30.0, 13.0, 21.0, 18.0, 12.0, 11.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.05409240722656, -38.81858444213867, -37.583072662353516, -36.347564697265625, -35.112056732177734, -33.87654495239258, -32.64103698730469, -31.405527114868164, -30.17001724243164, -28.934507369995117, -27.698999404907227, -26.463489532470703, -25.22797966003418, -23.992469787597656, -22.756961822509766, -21.521451950073242, -20.28594398498535, -19.050434112548828, -17.814926147460938, -16.579416275024414, -15.34390640258789, -14.108397483825684, -12.872888565063477, -11.637378692626953, -10.401869773864746, -9.166360855102539, -7.930850982666016, -6.695342063903809, -5.459832668304443, -4.224323272705078, -2.988814353942871, -1.7533044815063477, -0.5177955627441406, 0.7177137136459351, 1.9532229900360107, 3.188732147216797, 4.424241542816162, 5.659750938415527, 6.895259857177734, 8.130769729614258, 9.366278648376465, 10.601787567138672, 11.837297439575195, 13.072806358337402, 14.30831527709961, 15.543825149536133, 16.779335021972656, 18.014842987060547, 19.25035285949707, 20.485862731933594, 21.721370697021484, 22.956880569458008, 24.19239044189453, 25.427898406982422, 26.663408279418945, 27.89891815185547, 29.13442611694336, 30.369935989379883, 31.605443954467773, 32.8409538269043, 34.07646179199219, 35.311973571777344, 36.547481536865234, 37.782989501953125, 39.01850128173828]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 5.0, 25.0, 40.0, 46.0, 90.0, 120.0, 238.0, 444.0, 757.0, 1428.0, 2633.0, 5027.0, 10306.0, 21847.0, 49668.0, 119740.0, 280112.0, 309627.0, 140089.0, 57074.0, 25276.0, 11755.0, 5737.0, 2960.0, 1543.0, 847.0, 442.0, 294.0, 151.0, 94.0, 46.0, 34.0, 27.0, 6.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.359375, -22.693603515625, -22.02783203125, -21.362060546875, -20.6962890625, -20.030517578125, -19.36474609375, -18.698974609375, -18.033203125, -17.367431640625, -16.70166015625, -16.035888671875, -15.3701171875, -14.704345703125, -14.03857421875, -13.372802734375, -12.70703125, -12.041259765625, -11.37548828125, -10.709716796875, -10.0439453125, -9.378173828125, -8.71240234375, -8.046630859375, -7.380859375, -6.715087890625, -6.04931640625, -5.383544921875, -4.7177734375, -4.052001953125, -3.38623046875, -2.720458984375, -2.0546875, -1.388916015625, -0.72314453125, -0.057373046875, 0.6083984375, 1.274169921875, 1.93994140625, 2.605712890625, 3.271484375, 3.937255859375, 4.60302734375, 5.268798828125, 5.9345703125, 6.600341796875, 7.26611328125, 7.931884765625, 8.59765625, 9.263427734375, 9.92919921875, 10.594970703125, 11.2607421875, 11.926513671875, 12.59228515625, 13.258056640625, 13.923828125, 14.589599609375, 15.25537109375, 15.921142578125, 16.5869140625, 17.252685546875, 17.91845703125, 18.584228515625, 19.25]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 2.0, 8.0, 5.0, 11.0, 12.0, 15.0, 21.0, 16.0, 14.0, 18.0, 36.0, 25.0, 41.0, 40.0, 44.0, 46.0, 54.0, 50.0, 42.0, 50.0, 64.0, 45.0, 40.0, 44.0, 37.0, 37.0, 25.0, 17.0, 23.0, 25.0, 13.0, 17.0, 12.0, 10.0, 7.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.9013671875, -1.8409271240234375, -1.780487060546875, -1.7200469970703125, -1.65960693359375, -1.5991668701171875, -1.538726806640625, -1.4782867431640625, -1.4178466796875, -1.3574066162109375, -1.296966552734375, -1.2365264892578125, -1.17608642578125, -1.1156463623046875, -1.055206298828125, -0.9947662353515625, -0.934326171875, -0.8738861083984375, -0.813446044921875, -0.7530059814453125, -0.69256591796875, -0.6321258544921875, -0.571685791015625, -0.5112457275390625, -0.4508056640625, -0.3903656005859375, -0.329925537109375, -0.2694854736328125, -0.20904541015625, -0.1486053466796875, -0.088165283203125, -0.0277252197265625, 0.03271484375, 0.0931549072265625, 0.153594970703125, 0.2140350341796875, 0.27447509765625, 0.3349151611328125, 0.395355224609375, 0.4557952880859375, 0.5162353515625, 0.5766754150390625, 0.637115478515625, 0.6975555419921875, 0.75799560546875, 0.8184356689453125, 0.878875732421875, 0.9393157958984375, 0.999755859375, 1.0601959228515625, 1.120635986328125, 1.1810760498046875, 1.24151611328125, 1.3019561767578125, 1.362396240234375, 1.4228363037109375, 1.4832763671875, 1.5437164306640625, 1.604156494140625, 1.6645965576171875, 1.72503662109375, 1.7854766845703125, 1.845916748046875, 1.9063568115234375, 1.966796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 11.0, 15.0, 28.0, 75.0, 157.0, 430.0, 1347.0, 5086.0, 24362.0, 160063.0, 662916.0, 161562.0, 25059.0, 5258.0, 1374.0, 454.0, 164.0, 90.0, 40.0, 22.0, 14.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.03125, -29.90283203125, -28.7744140625, -27.64599609375, -26.517578125, -25.38916015625, -24.2607421875, -23.13232421875, -22.00390625, -20.87548828125, -19.7470703125, -18.61865234375, -17.490234375, -16.36181640625, -15.2333984375, -14.10498046875, -12.9765625, -11.84814453125, -10.7197265625, -9.59130859375, -8.462890625, -7.33447265625, -6.2060546875, -5.07763671875, -3.94921875, -2.82080078125, -1.6923828125, -0.56396484375, 0.564453125, 1.69287109375, 2.8212890625, 3.94970703125, 5.078125, 6.20654296875, 7.3349609375, 8.46337890625, 9.591796875, 10.72021484375, 11.8486328125, 12.97705078125, 14.10546875, 15.23388671875, 16.3623046875, 17.49072265625, 18.619140625, 19.74755859375, 20.8759765625, 22.00439453125, 23.1328125, 24.26123046875, 25.3896484375, 26.51806640625, 27.646484375, 28.77490234375, 29.9033203125, 31.03173828125, 32.16015625, 33.28857421875, 34.4169921875, 35.54541015625, 36.673828125, 37.80224609375, 38.9306640625, 40.05908203125, 41.1875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 9.0, 13.0, 12.0, 13.0, 15.0, 25.0, 18.0, 16.0, 20.0, 29.0, 30.0, 28.0, 27.0, 37.0, 26.0, 34.0, 37.0, 41.0, 54.0, 47.0, 39.0, 44.0, 37.0, 37.0, 38.0, 26.0, 29.0, 24.0, 23.0, 22.0, 23.0, 14.0, 15.0, 18.0, 11.0, 11.0, 8.0, 6.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-10.625, -10.297119140625, -9.96923828125, -9.641357421875, -9.3134765625, -8.985595703125, -8.65771484375, -8.329833984375, -8.001953125, -7.674072265625, -7.34619140625, -7.018310546875, -6.6904296875, -6.362548828125, -6.03466796875, -5.706787109375, -5.37890625, -5.051025390625, -4.72314453125, -4.395263671875, -4.0673828125, -3.739501953125, -3.41162109375, -3.083740234375, -2.755859375, -2.427978515625, -2.10009765625, -1.772216796875, -1.4443359375, -1.116455078125, -0.78857421875, -0.460693359375, -0.1328125, 0.195068359375, 0.52294921875, 0.850830078125, 1.1787109375, 1.506591796875, 1.83447265625, 2.162353515625, 2.490234375, 2.818115234375, 3.14599609375, 3.473876953125, 3.8017578125, 4.129638671875, 4.45751953125, 4.785400390625, 5.11328125, 5.441162109375, 5.76904296875, 6.096923828125, 6.4248046875, 6.752685546875, 7.08056640625, 7.408447265625, 7.736328125, 8.064208984375, 8.39208984375, 8.719970703125, 9.0478515625, 9.375732421875, 9.70361328125, 10.031494140625, 10.359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 11.0, 14.0, 23.0, 32.0, 63.0, 167.0, 395.0, 1006.0, 2956.0, 12642.0, 105324.0, 820626.0, 89522.0, 11428.0, 2785.0, 895.0, 353.0, 138.0, 73.0, 38.0, 22.0, 21.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-87.8125, -85.9228515625, -84.033203125, -82.1435546875, -80.25390625, -78.3642578125, -76.474609375, -74.5849609375, -72.6953125, -70.8056640625, -68.916015625, -67.0263671875, -65.13671875, -63.2470703125, -61.357421875, -59.4677734375, -57.578125, -55.6884765625, -53.798828125, -51.9091796875, -50.01953125, -48.1298828125, -46.240234375, -44.3505859375, -42.4609375, -40.5712890625, -38.681640625, -36.7919921875, -34.90234375, -33.0126953125, -31.123046875, -29.2333984375, -27.34375, -25.4541015625, -23.564453125, -21.6748046875, -19.78515625, -17.8955078125, -16.005859375, -14.1162109375, -12.2265625, -10.3369140625, -8.447265625, -6.5576171875, -4.66796875, -2.7783203125, -0.888671875, 1.0009765625, 2.890625, 4.7802734375, 6.669921875, 8.5595703125, 10.44921875, 12.3388671875, 14.228515625, 16.1181640625, 18.0078125, 19.8974609375, 21.787109375, 23.6767578125, 25.56640625, 27.4560546875, 29.345703125, 31.2353515625, 33.125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 10.0, 11.0, 13.0, 17.0, 36.0, 49.0, 75.0, 124.0, 195.0, 156.0, 123.0, 67.0, 49.0, 26.0, 16.0, 5.0, 4.0, 9.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002899169921875, -0.002813190221786499, -0.002727210521697998, -0.002641230821609497, -0.002555251121520996, -0.002469271421432495, -0.002383291721343994, -0.002297312021255493, -0.002211332321166992, -0.002125352621078491, -0.0020393729209899902, -0.0019533932209014893, -0.0018674135208129883, -0.0017814338207244873, -0.0016954541206359863, -0.0016094744205474854, -0.0015234947204589844, -0.0014375150203704834, -0.0013515353202819824, -0.0012655556201934814, -0.0011795759201049805, -0.0010935962200164795, -0.0010076165199279785, -0.0009216368198394775, -0.0008356571197509766, -0.0007496774196624756, -0.0006636977195739746, -0.0005777180194854736, -0.0004917383193969727, -0.0004057586193084717, -0.0003197789192199707, -0.00023379921913146973, -0.00014781951904296875, -6.183981895446777e-05, 2.4139881134033203e-05, 0.00011011958122253418, 0.00019609928131103516, 0.00028207898139953613, 0.0003680586814880371, 0.0004540383815765381, 0.0005400180816650391, 0.00062599778175354, 0.000711977481842041, 0.000797957181930542, 0.000883936882019043, 0.0009699165821075439, 0.001055896282196045, 0.001141875982284546, 0.0012278556823730469, 0.0013138353824615479, 0.0013998150825500488, 0.0014857947826385498, 0.0015717744827270508, 0.0016577541828155518, 0.0017437338829040527, 0.0018297135829925537, 0.0019156932830810547, 0.0020016729831695557, 0.0020876526832580566, 0.0021736323833465576, 0.0022596120834350586, 0.0023455917835235596, 0.0024315714836120605, 0.0025175511837005615, 0.0026035308837890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 16.0, 14.0, 29.0, 29.0, 44.0, 64.0, 100.0, 145.0, 209.0, 330.0, 489.0, 830.0, 1295.0, 2275.0, 3955.0, 7536.0, 15347.0, 36089.0, 107575.0, 355980.0, 344240.0, 103677.0, 35351.0, 15104.0, 7298.0, 4146.0, 2367.0, 1434.0, 831.0, 552.0, 361.0, 242.0, 171.0, 121.0, 80.0, 59.0, 50.0, 28.0, 22.0, 17.0, 15.0, 11.0, 4.0, 5.0, 6.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.015625, -17.347900390625, -16.68017578125, -16.012451171875, -15.3447265625, -14.677001953125, -14.00927734375, -13.341552734375, -12.673828125, -12.006103515625, -11.33837890625, -10.670654296875, -10.0029296875, -9.335205078125, -8.66748046875, -7.999755859375, -7.33203125, -6.664306640625, -5.99658203125, -5.328857421875, -4.6611328125, -3.993408203125, -3.32568359375, -2.657958984375, -1.990234375, -1.322509765625, -0.65478515625, 0.012939453125, 0.6806640625, 1.348388671875, 2.01611328125, 2.683837890625, 3.3515625, 4.019287109375, 4.68701171875, 5.354736328125, 6.0224609375, 6.690185546875, 7.35791015625, 8.025634765625, 8.693359375, 9.361083984375, 10.02880859375, 10.696533203125, 11.3642578125, 12.031982421875, 12.69970703125, 13.367431640625, 14.03515625, 14.702880859375, 15.37060546875, 16.038330078125, 16.7060546875, 17.373779296875, 18.04150390625, 18.709228515625, 19.376953125, 20.044677734375, 20.71240234375, 21.380126953125, 22.0478515625, 22.715576171875, 23.38330078125, 24.051025390625, 24.71875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 4.0, 10.0, 12.0, 13.0, 18.0, 18.0, 27.0, 30.0, 55.0, 76.0, 84.0, 101.0, 106.0, 95.0, 75.0, 68.0, 43.0, 34.0, 30.0, 20.0, 11.0, 8.0, 12.0, 7.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.6593017578125, -11.107666015625, -10.5560302734375, -10.00439453125, -9.4527587890625, -8.901123046875, -8.3494873046875, -7.7978515625, -7.2462158203125, -6.694580078125, -6.1429443359375, -5.59130859375, -5.0396728515625, -4.488037109375, -3.9364013671875, -3.384765625, -2.8331298828125, -2.281494140625, -1.7298583984375, -1.17822265625, -0.6265869140625, -0.074951171875, 0.4766845703125, 1.0283203125, 1.5799560546875, 2.131591796875, 2.6832275390625, 3.23486328125, 3.7864990234375, 4.338134765625, 4.8897705078125, 5.44140625, 5.9930419921875, 6.544677734375, 7.0963134765625, 7.64794921875, 8.1995849609375, 8.751220703125, 9.3028564453125, 9.8544921875, 10.4061279296875, 10.957763671875, 11.5093994140625, 12.06103515625, 12.6126708984375, 13.164306640625, 13.7159423828125, 14.267578125, 14.8192138671875, 15.370849609375, 15.9224853515625, 16.47412109375, 17.0257568359375, 17.577392578125, 18.1290283203125, 18.6806640625, 19.2322998046875, 19.783935546875, 20.3355712890625, 20.88720703125, 21.4388427734375, 21.990478515625, 22.5421142578125, 23.09375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 14.0, 29.0, 45.0, 88.0, 159.0, 206.0, 191.0, 115.0, 67.0, 33.0, 14.0, 5.0, 7.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.4331817626953, -153.01084899902344, -146.58851623535156, -140.1661834716797, -133.74383544921875, -127.3215103149414, -120.899169921875, -114.47683715820312, -108.05450439453125, -101.63217163085938, -95.2098388671875, -88.7874984741211, -82.36516571044922, -75.94283294677734, -69.52049255371094, -63.09815979003906, -56.67582702636719, -50.25349426269531, -43.83115768432617, -37.40882110595703, -30.986488342285156, -24.56415557861328, -18.14181900024414, -11.719482421875, -5.297149658203125, 1.1251850128173828, 7.547519683837891, 13.969854354858398, 20.392189025878906, 26.81452178955078, 33.23685836791992, 39.65919494628906, 46.081512451171875, 52.50384521484375, 58.92618179321289, 65.34851837158203, 71.7708511352539, 78.19318389892578, 84.61552429199219, 91.03785705566406, 97.46018981933594, 103.88252258300781, 110.30485534667969, 116.7271957397461, 123.14952850341797, 129.57186889648438, 135.99420166015625, 142.41653442382812, 148.8388671875, 155.26119995117188, 161.68353271484375, 168.10586547851562, 174.5281982421875, 180.95053100585938, 187.3728790283203, 193.7952117919922, 200.21754455566406, 206.63987731933594, 213.0622100830078, 219.4845428466797, 225.90689086914062, 232.3292236328125, 238.75155639648438, 245.17388916015625, 251.59622192382812]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 14.0, 13.0, 15.0, 19.0, 29.0, 41.0, 37.0, 50.0, 52.0, 70.0, 77.0, 100.0, 73.0, 82.0, 76.0, 52.0, 41.0, 30.0, 27.0, 19.0, 13.0, 9.0, 10.0, 5.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-132.16354370117188, -127.71258544921875, -123.26162719726562, -118.8106689453125, -114.35971069335938, -109.90875244140625, -105.45779418945312, -101.0068359375, -96.55587768554688, -92.10491943359375, -87.65396118164062, -83.2030029296875, -78.75204467773438, -74.30108642578125, -69.85012817382812, -65.399169921875, -60.948211669921875, -56.49725341796875, -52.046295166015625, -47.5953369140625, -43.144378662109375, -38.69342041015625, -34.242462158203125, -29.79150390625, -25.340545654296875, -20.88958740234375, -16.438629150390625, -11.9876708984375, -7.536712646484375, -3.08575439453125, 1.365203857421875, 5.816162109375, 10.267135620117188, 14.718093872070312, 19.169052124023438, 23.620010375976562, 28.070968627929688, 32.52192687988281, 36.97288513183594, 41.42384338378906, 45.87480163574219, 50.32575988769531, 54.77671813964844, 59.22767639160156, 63.67863464355469, 68.12959289550781, 72.58055114746094, 77.03150939941406, 81.48246765136719, 85.93342590332031, 90.38438415527344, 94.83534240722656, 99.28630065917969, 103.73725891113281, 108.18821716308594, 112.63917541503906, 117.09013366699219, 121.54109191894531, 125.99205017089844, 130.44300842285156, 134.8939666748047, 139.3449249267578, 143.79588317871094, 148.24684143066406, 152.6977996826172]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 8.0, 21.0, 23.0, 37.0, 66.0, 126.0, 153.0, 316.0, 530.0, 876.0, 1579.0, 2877.0, 5908.0, 12889.0, 34024.0, 137679.0, 3551778.0, 358117.0, 53731.0, 17676.0, 7413.0, 3760.0, 1967.0, 1104.0, 647.0, 368.0, 218.0, 131.0, 72.0, 56.0, 27.0, 25.0, 24.0, 19.0, 14.0, 12.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.125, -54.2353515625, -52.345703125, -50.4560546875, -48.56640625, -46.6767578125, -44.787109375, -42.8974609375, -41.0078125, -39.1181640625, -37.228515625, -35.3388671875, -33.44921875, -31.5595703125, -29.669921875, -27.7802734375, -25.890625, -24.0009765625, -22.111328125, -20.2216796875, -18.33203125, -16.4423828125, -14.552734375, -12.6630859375, -10.7734375, -8.8837890625, -6.994140625, -5.1044921875, -3.21484375, -1.3251953125, 0.564453125, 2.4541015625, 4.34375, 6.2333984375, 8.123046875, 10.0126953125, 11.90234375, 13.7919921875, 15.681640625, 17.5712890625, 19.4609375, 21.3505859375, 23.240234375, 25.1298828125, 27.01953125, 28.9091796875, 30.798828125, 32.6884765625, 34.578125, 36.4677734375, 38.357421875, 40.2470703125, 42.13671875, 44.0263671875, 45.916015625, 47.8056640625, 49.6953125, 51.5849609375, 53.474609375, 55.3642578125, 57.25390625, 59.1435546875, 61.033203125, 62.9228515625, 64.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 5.0, 12.0, 12.0, 13.0, 18.0, 22.0, 42.0, 38.0, 34.0, 56.0, 56.0, 59.0, 78.0, 61.0, 84.0, 76.0, 72.0, 55.0, 43.0, 35.0, 27.0, 17.0, 19.0, 17.0, 9.0, 13.0, 4.0, 8.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.640625, -2.550994873046875, -2.46136474609375, -2.371734619140625, -2.2821044921875, -2.192474365234375, -2.10284423828125, -2.013214111328125, -1.923583984375, -1.833953857421875, -1.74432373046875, -1.654693603515625, -1.5650634765625, -1.475433349609375, -1.38580322265625, -1.296173095703125, -1.20654296875, -1.116912841796875, -1.02728271484375, -0.937652587890625, -0.8480224609375, -0.758392333984375, -0.66876220703125, -0.579132080078125, -0.489501953125, -0.399871826171875, -0.31024169921875, -0.220611572265625, -0.1309814453125, -0.041351318359375, 0.04827880859375, 0.137908935546875, 0.2275390625, 0.317169189453125, 0.40679931640625, 0.496429443359375, 0.5860595703125, 0.675689697265625, 0.76531982421875, 0.854949951171875, 0.944580078125, 1.034210205078125, 1.12384033203125, 1.213470458984375, 1.3031005859375, 1.392730712890625, 1.48236083984375, 1.571990966796875, 1.66162109375, 1.751251220703125, 1.84088134765625, 1.930511474609375, 2.0201416015625, 2.109771728515625, 2.19940185546875, 2.289031982421875, 2.378662109375, 2.468292236328125, 2.55792236328125, 2.647552490234375, 2.7371826171875, 2.826812744140625, 2.91644287109375, 3.006072998046875, 3.095703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 14.0, 26.0, 37.0, 52.0, 74.0, 168.0, 277.0, 624.0, 1575.0, 5280.0, 22629.0, 170816.0, 3611610.0, 335762.0, 34657.0, 7112.0, 2023.0, 774.0, 343.0, 170.0, 88.0, 49.0, 30.0, 27.0, 6.0, 7.0, 7.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.625, -67.2744140625, -64.923828125, -62.5732421875, -60.22265625, -57.8720703125, -55.521484375, -53.1708984375, -50.8203125, -48.4697265625, -46.119140625, -43.7685546875, -41.41796875, -39.0673828125, -36.716796875, -34.3662109375, -32.015625, -29.6650390625, -27.314453125, -24.9638671875, -22.61328125, -20.2626953125, -17.912109375, -15.5615234375, -13.2109375, -10.8603515625, -8.509765625, -6.1591796875, -3.80859375, -1.4580078125, 0.892578125, 3.2431640625, 5.59375, 7.9443359375, 10.294921875, 12.6455078125, 14.99609375, 17.3466796875, 19.697265625, 22.0478515625, 24.3984375, 26.7490234375, 29.099609375, 31.4501953125, 33.80078125, 36.1513671875, 38.501953125, 40.8525390625, 43.203125, 45.5537109375, 47.904296875, 50.2548828125, 52.60546875, 54.9560546875, 57.306640625, 59.6572265625, 62.0078125, 64.3583984375, 66.708984375, 69.0595703125, 71.41015625, 73.7607421875, 76.111328125, 78.4619140625, 80.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 11.0, 14.0, 31.0, 30.0, 57.0, 82.0, 158.0, 262.0, 650.0, 1669.0, 490.0, 231.0, 135.0, 86.0, 51.0, 23.0, 24.0, 12.0, 17.0, 6.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9820556640625, -9.682861328125, -9.3836669921875, -9.08447265625, -8.7852783203125, -8.486083984375, -8.1868896484375, -7.8876953125, -7.5885009765625, -7.289306640625, -6.9901123046875, -6.69091796875, -6.3917236328125, -6.092529296875, -5.7933349609375, -5.494140625, -5.1949462890625, -4.895751953125, -4.5965576171875, -4.29736328125, -3.9981689453125, -3.698974609375, -3.3997802734375, -3.1005859375, -2.8013916015625, -2.502197265625, -2.2030029296875, -1.90380859375, -1.6046142578125, -1.305419921875, -1.0062255859375, -0.70703125, -0.4078369140625, -0.108642578125, 0.1905517578125, 0.48974609375, 0.7889404296875, 1.088134765625, 1.3873291015625, 1.6865234375, 1.9857177734375, 2.284912109375, 2.5841064453125, 2.88330078125, 3.1824951171875, 3.481689453125, 3.7808837890625, 4.080078125, 4.3792724609375, 4.678466796875, 4.9776611328125, 5.27685546875, 5.5760498046875, 5.875244140625, 6.1744384765625, 6.4736328125, 6.7728271484375, 7.072021484375, 7.3712158203125, 7.67041015625, 7.9696044921875, 8.268798828125, 8.5679931640625, 8.8671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 10.0, 16.0, 21.0, 31.0, 69.0, 120.0, 176.0, 182.0, 172.0, 93.0, 48.0, 33.0, 18.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.056697845458984, -34.79891586303711, -32.5411376953125, -30.283355712890625, -28.025575637817383, -25.76779556274414, -23.510013580322266, -21.252233505249023, -18.99445343017578, -16.73667335510254, -14.47889232635498, -12.221111297607422, -9.96333122253418, -7.7055511474609375, -5.447770118713379, -3.1899890899658203, -0.9322090148925781, 1.3255715370178223, 3.5833520889282227, 5.841132640838623, 8.098913192749023, 10.356693267822266, 12.614474296569824, 14.872255325317383, 17.130035400390625, 19.387815475463867, 21.64559555053711, 23.903377532958984, 26.161157608032227, 28.41893768310547, 30.676719665527344, 32.93450164794922, 35.192283630371094, 37.45006561279297, 39.70784378051758, 41.96562576293945, 44.22340393066406, 46.48118591308594, 48.73896789550781, 50.99674987792969, 53.2545280456543, 55.51231002807617, 57.77008819580078, 60.027870178222656, 62.28565216064453, 64.54342651367188, 66.80120849609375, 69.05899047851562, 71.3167724609375, 73.57455444335938, 75.83233642578125, 78.0901107788086, 80.34789276123047, 82.60567474365234, 84.86345672607422, 87.1212387084961, 89.37901306152344, 91.63679504394531, 93.89457702636719, 96.15235137939453, 98.4101333618164, 100.66791534423828, 102.92569732666016, 105.18347930908203, 107.4412612915039]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 13.0, 10.0, 13.0, 15.0, 25.0, 20.0, 22.0, 30.0, 41.0, 35.0, 51.0, 47.0, 56.0, 56.0, 46.0, 52.0, 42.0, 46.0, 46.0, 40.0, 38.0, 44.0, 32.0, 38.0, 21.0, 19.0, 24.0, 14.0, 14.0, 10.0, 4.0, 10.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-32.26142120361328, -31.34774398803711, -30.434066772460938, -29.520389556884766, -28.606712341308594, -27.693035125732422, -26.77935791015625, -25.86568260192871, -24.95200538635254, -24.038328170776367, -23.124650955200195, -22.210973739624023, -21.29729652404785, -20.383621215820312, -19.46994400024414, -18.55626678466797, -17.642589569091797, -16.728912353515625, -15.815235137939453, -14.901557922363281, -13.987881660461426, -13.074204444885254, -12.160527229309082, -11.246850967407227, -10.333171844482422, -9.41949462890625, -8.505817413330078, -7.5921406745910645, -6.678463935852051, -5.764786720275879, -4.851109504699707, -3.9374327659606934, -3.0237560272216797, -2.110079050064087, -1.1964019536972046, -0.28272485733032227, 0.6309521198272705, 1.5446290969848633, 2.458306312561035, 3.371983051300049, 4.285660266876221, 5.199337482452393, 6.113014221191406, 7.026691436767578, 7.94036865234375, 8.854045867919922, 9.767723083496094, 10.68139934539795, 11.595076560974121, 12.508753776550293, 13.422430992126465, 14.33610725402832, 15.249784469604492, 16.163461685180664, 17.077138900756836, 17.990816116333008, 18.90449333190918, 19.81817054748535, 20.731847763061523, 21.645524978637695, 22.559202194213867, 23.472877502441406, 24.386554718017578, 25.30023193359375, 26.213909149169922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 6.0, 10.0, 17.0, 15.0, 20.0, 38.0, 42.0, 67.0, 109.0, 308.0, 1199.0, 6348.0, 43488.0, 359241.0, 545880.0, 78401.0, 10594.0, 1960.0, 405.0, 143.0, 65.0, 30.0, 32.0, 29.0, 23.0, 13.0, 12.0, 9.0, 7.0, 6.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.5625, -54.90576171875, -53.2490234375, -51.59228515625, -49.935546875, -48.27880859375, -46.6220703125, -44.96533203125, -43.30859375, -41.65185546875, -39.9951171875, -38.33837890625, -36.681640625, -35.02490234375, -33.3681640625, -31.71142578125, -30.0546875, -28.39794921875, -26.7412109375, -25.08447265625, -23.427734375, -21.77099609375, -20.1142578125, -18.45751953125, -16.80078125, -15.14404296875, -13.4873046875, -11.83056640625, -10.173828125, -8.51708984375, -6.8603515625, -5.20361328125, -3.546875, -1.89013671875, -0.2333984375, 1.42333984375, 3.080078125, 4.73681640625, 6.3935546875, 8.05029296875, 9.70703125, 11.36376953125, 13.0205078125, 14.67724609375, 16.333984375, 17.99072265625, 19.6474609375, 21.30419921875, 22.9609375, 24.61767578125, 26.2744140625, 27.93115234375, 29.587890625, 31.24462890625, 32.9013671875, 34.55810546875, 36.21484375, 37.87158203125, 39.5283203125, 41.18505859375, 42.841796875, 44.49853515625, 46.1552734375, 47.81201171875, 49.46875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 11.0, 19.0, 33.0, 52.0, 45.0, 69.0, 75.0, 92.0, 99.0, 97.0, 99.0, 78.0, 65.0, 38.0, 42.0, 26.0, 17.0, 17.0, 5.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6025543212890625, -1.487335205078125, -1.3721160888671875, -1.25689697265625, -1.1416778564453125, -1.026458740234375, -0.9112396240234375, -0.7960205078125, -0.6808013916015625, -0.565582275390625, -0.4503631591796875, -0.33514404296875, -0.2199249267578125, -0.104705810546875, 0.0105133056640625, 0.125732421875, 0.2409515380859375, 0.356170654296875, 0.4713897705078125, 0.58660888671875, 0.7018280029296875, 0.817047119140625, 0.9322662353515625, 1.0474853515625, 1.1627044677734375, 1.277923583984375, 1.3931427001953125, 1.50836181640625, 1.6235809326171875, 1.738800048828125, 1.8540191650390625, 1.96923828125, 2.0844573974609375, 2.199676513671875, 2.3148956298828125, 2.43011474609375, 2.5453338623046875, 2.660552978515625, 2.7757720947265625, 2.8909912109375, 3.0062103271484375, 3.121429443359375, 3.2366485595703125, 3.35186767578125, 3.4670867919921875, 3.582305908203125, 3.6975250244140625, 3.812744140625, 3.9279632568359375, 4.043182373046875, 4.1584014892578125, 4.27362060546875, 4.3888397216796875, 4.504058837890625, 4.6192779541015625, 4.7344970703125, 4.8497161865234375, 4.964935302734375, 5.0801544189453125, 5.19537353515625, 5.3105926513671875, 5.425811767578125, 5.5410308837890625, 5.65625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 14.0, 11.0, 14.0, 17.0, 16.0, 28.0, 31.0, 43.0, 62.0, 99.0, 107.0, 169.0, 249.0, 298.0, 458.0, 718.0, 1270.0, 2468.0, 5914.0, 16521.0, 55698.0, 189123.0, 405187.0, 252774.0, 78923.0, 23462.0, 7773.0, 2993.0, 1467.0, 776.0, 527.0, 368.0, 275.0, 178.0, 137.0, 103.0, 75.0, 57.0, 31.0, 28.0, 36.0, 18.0, 14.0, 4.0, 9.0, 0.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.25, -25.420166015625, -24.59033203125, -23.760498046875, -22.9306640625, -22.100830078125, -21.27099609375, -20.441162109375, -19.611328125, -18.781494140625, -17.95166015625, -17.121826171875, -16.2919921875, -15.462158203125, -14.63232421875, -13.802490234375, -12.97265625, -12.142822265625, -11.31298828125, -10.483154296875, -9.6533203125, -8.823486328125, -7.99365234375, -7.163818359375, -6.333984375, -5.504150390625, -4.67431640625, -3.844482421875, -3.0146484375, -2.184814453125, -1.35498046875, -0.525146484375, 0.3046875, 1.134521484375, 1.96435546875, 2.794189453125, 3.6240234375, 4.453857421875, 5.28369140625, 6.113525390625, 6.943359375, 7.773193359375, 8.60302734375, 9.432861328125, 10.2626953125, 11.092529296875, 11.92236328125, 12.752197265625, 13.58203125, 14.411865234375, 15.24169921875, 16.071533203125, 16.9013671875, 17.731201171875, 18.56103515625, 19.390869140625, 20.220703125, 21.050537109375, 21.88037109375, 22.710205078125, 23.5400390625, 24.369873046875, 25.19970703125, 26.029541015625, 26.859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 12.0, 11.0, 18.0, 16.0, 17.0, 28.0, 18.0, 31.0, 28.0, 37.0, 40.0, 41.0, 31.0, 58.0, 45.0, 49.0, 40.0, 50.0, 56.0, 46.0, 27.0, 37.0, 37.0, 38.0, 16.0, 23.0, 15.0, 21.0, 21.0, 15.0, 17.0, 10.0, 6.0, 11.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.1953125, -12.8140869140625, -12.432861328125, -12.0516357421875, -11.67041015625, -11.2891845703125, -10.907958984375, -10.5267333984375, -10.1455078125, -9.7642822265625, -9.383056640625, -9.0018310546875, -8.62060546875, -8.2393798828125, -7.858154296875, -7.4769287109375, -7.095703125, -6.7144775390625, -6.333251953125, -5.9520263671875, -5.57080078125, -5.1895751953125, -4.808349609375, -4.4271240234375, -4.0458984375, -3.6646728515625, -3.283447265625, -2.9022216796875, -2.52099609375, -2.1397705078125, -1.758544921875, -1.3773193359375, -0.99609375, -0.6148681640625, -0.233642578125, 0.1475830078125, 0.52880859375, 0.9100341796875, 1.291259765625, 1.6724853515625, 2.0537109375, 2.4349365234375, 2.816162109375, 3.1973876953125, 3.57861328125, 3.9598388671875, 4.341064453125, 4.7222900390625, 5.103515625, 5.4847412109375, 5.865966796875, 6.2471923828125, 6.62841796875, 7.0096435546875, 7.390869140625, 7.7720947265625, 8.1533203125, 8.5345458984375, 8.915771484375, 9.2969970703125, 9.67822265625, 10.0594482421875, 10.440673828125, 10.8218994140625, 11.203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 6.0, 12.0, 16.0, 20.0, 29.0, 49.0, 90.0, 127.0, 225.0, 407.0, 753.0, 1362.0, 3100.0, 7549.0, 21899.0, 73770.0, 258416.0, 424315.0, 179603.0, 50872.0, 15546.0, 5460.0, 2395.0, 1128.0, 569.0, 303.0, 196.0, 132.0, 63.0, 42.0, 26.0, 21.0, 18.0, 18.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.453125, -19.613037109375, -18.77294921875, -17.932861328125, -17.0927734375, -16.252685546875, -15.41259765625, -14.572509765625, -13.732421875, -12.892333984375, -12.05224609375, -11.212158203125, -10.3720703125, -9.531982421875, -8.69189453125, -7.851806640625, -7.01171875, -6.171630859375, -5.33154296875, -4.491455078125, -3.6513671875, -2.811279296875, -1.97119140625, -1.131103515625, -0.291015625, 0.549072265625, 1.38916015625, 2.229248046875, 3.0693359375, 3.909423828125, 4.74951171875, 5.589599609375, 6.4296875, 7.269775390625, 8.10986328125, 8.949951171875, 9.7900390625, 10.630126953125, 11.47021484375, 12.310302734375, 13.150390625, 13.990478515625, 14.83056640625, 15.670654296875, 16.5107421875, 17.350830078125, 18.19091796875, 19.031005859375, 19.87109375, 20.711181640625, 21.55126953125, 22.391357421875, 23.2314453125, 24.071533203125, 24.91162109375, 25.751708984375, 26.591796875, 27.431884765625, 28.27197265625, 29.112060546875, 29.9521484375, 30.792236328125, 31.63232421875, 32.472412109375, 33.3125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 22.0, 28.0, 32.0, 33.0, 40.0, 47.0, 54.0, 83.0, 90.0, 88.0, 107.0, 66.0, 57.0, 44.0, 44.0, 30.0, 30.0, 16.0, 10.0, 10.0, 4.0, 12.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00262451171875, -0.0025433599948883057, -0.0024622082710266113, -0.002381056547164917, -0.0022999048233032227, -0.0022187530994415283, -0.002137601375579834, -0.0020564496517181396, -0.0019752979278564453, -0.001894146203994751, -0.0018129944801330566, -0.0017318427562713623, -0.001650691032409668, -0.0015695393085479736, -0.0014883875846862793, -0.001407235860824585, -0.0013260841369628906, -0.0012449324131011963, -0.001163780689239502, -0.0010826289653778076, -0.0010014772415161133, -0.0009203255176544189, -0.0008391737937927246, -0.0007580220699310303, -0.0006768703460693359, -0.0005957186222076416, -0.0005145668983459473, -0.00043341517448425293, -0.0003522634506225586, -0.00027111172676086426, -0.00018996000289916992, -0.00010880827903747559, -2.765655517578125e-05, 5.3495168685913086e-05, 0.00013464689254760742, 0.00021579861640930176, 0.0002969503402709961, 0.00037810206413269043, 0.00045925378799438477, 0.0005404055118560791, 0.0006215572357177734, 0.0007027089595794678, 0.0007838606834411621, 0.0008650124073028564, 0.0009461641311645508, 0.0010273158550262451, 0.0011084675788879395, 0.0011896193027496338, 0.0012707710266113281, 0.0013519227504730225, 0.0014330744743347168, 0.0015142261981964111, 0.0015953779220581055, 0.0016765296459197998, 0.0017576813697814941, 0.0018388330936431885, 0.0019199848175048828, 0.002001136541366577, 0.0020822882652282715, 0.002163439989089966, 0.00224459171295166, 0.0023257434368133545, 0.002406895160675049, 0.002488046884536743, 0.0025691986083984375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 2.0, 1.0, 1.0, 7.0, 13.0, 13.0, 20.0, 18.0, 21.0, 31.0, 53.0, 65.0, 103.0, 144.0, 173.0, 336.0, 589.0, 1171.0, 2268.0, 5334.0, 14274.0, 43287.0, 153118.0, 416964.0, 286311.0, 82616.0, 25123.0, 9000.0, 3647.0, 1604.0, 879.0, 443.0, 279.0, 190.0, 125.0, 97.0, 74.0, 37.0, 29.0, 22.0, 19.0, 10.0, 8.0, 6.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.1875, -26.33154296875, -25.4755859375, -24.61962890625, -23.763671875, -22.90771484375, -22.0517578125, -21.19580078125, -20.33984375, -19.48388671875, -18.6279296875, -17.77197265625, -16.916015625, -16.06005859375, -15.2041015625, -14.34814453125, -13.4921875, -12.63623046875, -11.7802734375, -10.92431640625, -10.068359375, -9.21240234375, -8.3564453125, -7.50048828125, -6.64453125, -5.78857421875, -4.9326171875, -4.07666015625, -3.220703125, -2.36474609375, -1.5087890625, -0.65283203125, 0.203125, 1.05908203125, 1.9150390625, 2.77099609375, 3.626953125, 4.48291015625, 5.3388671875, 6.19482421875, 7.05078125, 7.90673828125, 8.7626953125, 9.61865234375, 10.474609375, 11.33056640625, 12.1865234375, 13.04248046875, 13.8984375, 14.75439453125, 15.6103515625, 16.46630859375, 17.322265625, 18.17822265625, 19.0341796875, 19.89013671875, 20.74609375, 21.60205078125, 22.4580078125, 23.31396484375, 24.169921875, 25.02587890625, 25.8818359375, 26.73779296875, 27.59375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 8.0, 13.0, 8.0, 16.0, 18.0, 22.0, 37.0, 48.0, 35.0, 66.0, 56.0, 63.0, 81.0, 70.0, 78.0, 59.0, 60.0, 44.0, 36.0, 30.0, 27.0, 26.0, 22.0, 15.0, 3.0, 12.0, 8.0, 8.0, 8.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.8812255859375, -12.496826171875, -12.1124267578125, -11.72802734375, -11.3436279296875, -10.959228515625, -10.5748291015625, -10.1904296875, -9.8060302734375, -9.421630859375, -9.0372314453125, -8.65283203125, -8.2684326171875, -7.884033203125, -7.4996337890625, -7.115234375, -6.7308349609375, -6.346435546875, -5.9620361328125, -5.57763671875, -5.1932373046875, -4.808837890625, -4.4244384765625, -4.0400390625, -3.6556396484375, -3.271240234375, -2.8868408203125, -2.50244140625, -2.1180419921875, -1.733642578125, -1.3492431640625, -0.96484375, -0.5804443359375, -0.196044921875, 0.1883544921875, 0.57275390625, 0.9571533203125, 1.341552734375, 1.7259521484375, 2.1103515625, 2.4947509765625, 2.879150390625, 3.2635498046875, 3.64794921875, 4.0323486328125, 4.416748046875, 4.8011474609375, 5.185546875, 5.5699462890625, 5.954345703125, 6.3387451171875, 6.72314453125, 7.1075439453125, 7.491943359375, 7.8763427734375, 8.2607421875, 8.6451416015625, 9.029541015625, 9.4139404296875, 9.79833984375, 10.1827392578125, 10.567138671875, 10.9515380859375, 11.3359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 11.0, 29.0, 49.0, 84.0, 164.0, 191.0, 172.0, 127.0, 75.0, 39.0, 23.0, 12.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.6391296386719, -249.26834106445312, -241.89755249023438, -234.52676391601562, -227.1559600830078, -219.78517150878906, -212.4143829345703, -205.04359436035156, -197.67279052734375, -190.302001953125, -182.93121337890625, -175.5604248046875, -168.1896209716797, -160.81883239746094, -153.4480438232422, -146.07725524902344, -138.7064666748047, -131.33567810058594, -123.96488189697266, -116.5940933227539, -109.22329711914062, -101.85250854492188, -94.48171997070312, -87.11093139648438, -79.7401351928711, -72.36934661865234, -64.99855041503906, -57.62776184082031, -50.2569694519043, -42.88617706298828, -35.51538848876953, -28.144596099853516, -20.7738037109375, -13.4030122756958, -6.032220840454102, 1.3385696411132812, 8.709362030029297, 16.080154418945312, 23.450942993164062, 30.821735382080078, 38.192527770996094, 45.56332015991211, 52.934112548828125, 60.304901123046875, 67.67568969726562, 75.0464859008789, 82.41727447509766, 89.78807067871094, 97.15885925292969, 104.52964782714844, 111.90044403076172, 119.27123260498047, 126.64202880859375, 134.0128173828125, 141.38360595703125, 148.75439453125, 156.12518310546875, 163.4959716796875, 170.86676025390625, 178.237548828125, 185.6083526611328, 192.97914123535156, 200.3499298095703, 207.72071838378906, 215.09152221679688]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 7.0, 12.0, 22.0, 18.0, 28.0, 33.0, 31.0, 46.0, 40.0, 47.0, 51.0, 63.0, 50.0, 64.0, 47.0, 44.0, 60.0, 49.0, 49.0, 37.0, 35.0, 30.0, 26.0, 19.0, 19.0, 15.0, 13.0, 7.0, 15.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-142.22293090820312, -138.83920288085938, -135.45547485351562, -132.07174682617188, -128.6880340576172, -125.30430603027344, -121.92057800292969, -118.53684997558594, -115.15312957763672, -111.76940155029297, -108.38568115234375, -105.001953125, -101.61822509765625, -98.23450469970703, -94.85077667236328, -91.46705627441406, -88.08332824707031, -84.69960021972656, -81.31587982177734, -77.9321517944336, -74.54842376708984, -71.16470336914062, -67.78097534179688, -64.39724731445312, -61.013519287109375, -57.62979507446289, -54.24606704711914, -50.862342834472656, -47.47861862182617, -44.09489440917969, -40.71116638183594, -37.32744216918945, -33.94371795654297, -30.55999183654785, -27.176267623901367, -23.79254150390625, -20.408817291259766, -17.02509117126465, -13.641365051269531, -10.257640838623047, -6.87391471862793, -3.49018931388855, -0.10646390914916992, 3.277261734008789, 6.66098690032959, 10.04471206665039, 13.428438186645508, 16.812162399291992, 20.19588851928711, 23.579614639282227, 26.96333885192871, 30.347064971923828, 33.73078918457031, 37.11451721191406, 40.49824142456055, 43.88196563720703, 47.26569366455078, 50.649417877197266, 54.033145904541016, 57.4168701171875, 60.800594329833984, 64.18431854248047, 67.56804656982422, 70.95176696777344, 74.33549499511719]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 10.0, 13.0, 21.0, 35.0, 57.0, 97.0, 235.0, 1787.0, 42350.0, 4097835.0, 49331.0, 1845.0, 302.0, 132.0, 93.0, 42.0, 34.0, 28.0, 13.0, 12.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.75, -140.25390625, -134.7578125, -129.26171875, -123.765625, -118.26953125, -112.7734375, -107.27734375, -101.78125, -96.28515625, -90.7890625, -85.29296875, -79.796875, -74.30078125, -68.8046875, -63.30859375, -57.8125, -52.31640625, -46.8203125, -41.32421875, -35.828125, -30.33203125, -24.8359375, -19.33984375, -13.84375, -8.34765625, -2.8515625, 2.64453125, 8.140625, 13.63671875, 19.1328125, 24.62890625, 30.125, 35.62109375, 41.1171875, 46.61328125, 52.109375, 57.60546875, 63.1015625, 68.59765625, 74.09375, 79.58984375, 85.0859375, 90.58203125, 96.078125, 101.57421875, 107.0703125, 112.56640625, 118.0625, 123.55859375, 129.0546875, 134.55078125, 140.046875, 145.54296875, 151.0390625, 156.53515625, 162.03125, 167.52734375, 173.0234375, 178.51953125, 184.015625, 189.51171875, 195.0078125, 200.50390625, 206.0]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 10.0, 8.0, 15.0, 19.0, 34.0, 42.0, 66.0, 70.0, 94.0, 103.0, 104.0, 89.0, 95.0, 76.0, 65.0, 40.0, 23.0, 20.0, 17.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.072021484375, -3.91748046875, -3.762939453125, -3.6083984375, -3.453857421875, -3.29931640625, -3.144775390625, -2.990234375, -2.835693359375, -2.68115234375, -2.526611328125, -2.3720703125, -2.217529296875, -2.06298828125, -1.908447265625, -1.75390625, -1.599365234375, -1.44482421875, -1.290283203125, -1.1357421875, -0.981201171875, -0.82666015625, -0.672119140625, -0.517578125, -0.363037109375, -0.20849609375, -0.053955078125, 0.1005859375, 0.255126953125, 0.40966796875, 0.564208984375, 0.71875, 0.873291015625, 1.02783203125, 1.182373046875, 1.3369140625, 1.491455078125, 1.64599609375, 1.800537109375, 1.955078125, 2.109619140625, 2.26416015625, 2.418701171875, 2.5732421875, 2.727783203125, 2.88232421875, 3.036865234375, 3.19140625, 3.345947265625, 3.50048828125, 3.655029296875, 3.8095703125, 3.964111328125, 4.11865234375, 4.273193359375, 4.427734375, 4.582275390625, 4.73681640625, 4.891357421875, 5.0458984375, 5.200439453125, 5.35498046875, 5.509521484375, 5.6640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 12.0, 7.0, 11.0, 15.0, 16.0, 21.0, 24.0, 26.0, 45.0, 60.0, 94.0, 121.0, 191.0, 313.0, 585.0, 1165.0, 2797.0, 7862.0, 26771.0, 120375.0, 1201273.0, 2622468.0, 160235.0, 34006.0, 9535.0, 3259.0, 1391.0, 655.0, 321.0, 205.0, 140.0, 76.0, 45.0, 41.0, 24.0, 24.0, 18.0, 13.0, 11.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.78125, -52.248046875, -50.71484375, -49.181640625, -47.6484375, -46.115234375, -44.58203125, -43.048828125, -41.515625, -39.982421875, -38.44921875, -36.916015625, -35.3828125, -33.849609375, -32.31640625, -30.783203125, -29.25, -27.716796875, -26.18359375, -24.650390625, -23.1171875, -21.583984375, -20.05078125, -18.517578125, -16.984375, -15.451171875, -13.91796875, -12.384765625, -10.8515625, -9.318359375, -7.78515625, -6.251953125, -4.71875, -3.185546875, -1.65234375, -0.119140625, 1.4140625, 2.947265625, 4.48046875, 6.013671875, 7.546875, 9.080078125, 10.61328125, 12.146484375, 13.6796875, 15.212890625, 16.74609375, 18.279296875, 19.8125, 21.345703125, 22.87890625, 24.412109375, 25.9453125, 27.478515625, 29.01171875, 30.544921875, 32.078125, 33.611328125, 35.14453125, 36.677734375, 38.2109375, 39.744140625, 41.27734375, 42.810546875, 44.34375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 12.0, 9.0, 33.0, 23.0, 49.0, 79.0, 141.0, 281.0, 725.0, 1656.0, 511.0, 203.0, 130.0, 63.0, 60.0, 35.0, 18.0, 11.0, 10.0, 6.0, 7.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.015625, -15.645751953125, -15.27587890625, -14.906005859375, -14.5361328125, -14.166259765625, -13.79638671875, -13.426513671875, -13.056640625, -12.686767578125, -12.31689453125, -11.947021484375, -11.5771484375, -11.207275390625, -10.83740234375, -10.467529296875, -10.09765625, -9.727783203125, -9.35791015625, -8.988037109375, -8.6181640625, -8.248291015625, -7.87841796875, -7.508544921875, -7.138671875, -6.768798828125, -6.39892578125, -6.029052734375, -5.6591796875, -5.289306640625, -4.91943359375, -4.549560546875, -4.1796875, -3.809814453125, -3.43994140625, -3.070068359375, -2.7001953125, -2.330322265625, -1.96044921875, -1.590576171875, -1.220703125, -0.850830078125, -0.48095703125, -0.111083984375, 0.2587890625, 0.628662109375, 0.99853515625, 1.368408203125, 1.73828125, 2.108154296875, 2.47802734375, 2.847900390625, 3.2177734375, 3.587646484375, 3.95751953125, 4.327392578125, 4.697265625, 5.067138671875, 5.43701171875, 5.806884765625, 6.1767578125, 6.546630859375, 6.91650390625, 7.286376953125, 7.65625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 14.0, 50.0, 118.0, 200.0, 263.0, 172.0, 107.0, 42.0, 11.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.45655822753906, -179.21998596191406, -174.9833984375, -170.746826171875, -166.51025390625, -162.273681640625, -158.037109375, -153.80052185058594, -149.56394958496094, -145.32737731933594, -141.09078979492188, -136.85421752929688, -132.61764526367188, -128.38107299804688, -124.14449310302734, -119.90791320800781, -115.67134094238281, -111.43476867675781, -107.19818878173828, -102.96160888671875, -98.72503662109375, -94.48846435546875, -90.25188446044922, -86.01530456542969, -81.77873229980469, -77.54216003417969, -73.30558013916016, -69.06900024414062, -64.83242797851562, -60.59585189819336, -56.359275817871094, -52.12269973754883, -47.88611602783203, -43.649539947509766, -39.4129638671875, -35.176387786865234, -30.93981170654297, -26.703235626220703, -22.466659545898438, -18.230083465576172, -13.993507385253906, -9.75693130493164, -5.520355224609375, -1.2837791442871094, 2.9527969360351562, 7.189373016357422, 11.425949096679688, 15.662525177001953, 19.89910125732422, 24.135677337646484, 28.37225341796875, 32.608829498291016, 36.84540557861328, 41.08198165893555, 45.31855773925781, 49.55513381958008, 53.791709899902344, 58.02828598022461, 62.264862060546875, 66.50143432617188, 70.7380142211914, 74.97459411621094, 79.21116638183594, 83.44773864746094, 87.68431854248047]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 5.0, 8.0, 10.0, 12.0, 20.0, 13.0, 31.0, 18.0, 29.0, 20.0, 33.0, 36.0, 45.0, 42.0, 43.0, 34.0, 40.0, 41.0, 35.0, 35.0, 51.0, 41.0, 41.0, 36.0, 32.0, 26.0, 31.0, 25.0, 18.0, 20.0, 17.0, 21.0, 9.0, 17.0, 8.0, 14.0, 7.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.88884735107422, -30.899494171142578, -29.91014289855957, -28.92078971862793, -27.931438446044922, -26.94208526611328, -25.95273208618164, -24.963380813598633, -23.974027633666992, -22.98467445373535, -21.995323181152344, -21.005970001220703, -20.016618728637695, -19.027265548706055, -18.037914276123047, -17.048561096191406, -16.059207916259766, -15.069855690002441, -14.080503463745117, -13.091150283813477, -12.101798057556152, -11.112445831298828, -10.123093605041504, -9.13374137878418, -8.144390106201172, -7.155037879943848, -6.165685176849365, -5.176332950592041, -4.186980247497559, -3.1976280212402344, -2.20827579498291, -1.2189230918884277, -0.2295703887939453, 0.7597820162773132, 1.7491344213485718, 2.7384867668151855, 3.727839231491089, 4.717191696166992, 5.706543922424316, 6.695896625518799, 7.685248851776123, 8.674601554870605, 9.66395378112793, 10.653306007385254, 11.642658233642578, 12.632011413574219, 13.621362686157227, 14.610715866088867, 15.600068092346191, 16.589420318603516, 17.578773498535156, 18.568124771118164, 19.557477951049805, 20.546829223632812, 21.536182403564453, 22.525535583496094, 23.5148868560791, 24.504240036010742, 25.49359130859375, 26.48294448852539, 27.4722957611084, 28.46164894104004, 29.451000213623047, 30.440353393554688, 31.429706573486328]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 13.0, 12.0, 8.0, 19.0, 17.0, 34.0, 28.0, 32.0, 55.0, 75.0, 125.0, 234.0, 442.0, 1133.0, 3194.0, 10380.0, 36794.0, 135507.0, 388350.0, 328191.0, 103536.0, 27934.0, 8031.0, 2475.0, 947.0, 379.0, 191.0, 107.0, 83.0, 46.0, 33.0, 32.0, 17.0, 17.0, 18.0, 8.0, 10.0, 4.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-30.203125, -29.284912109375, -28.36669921875, -27.448486328125, -26.5302734375, -25.612060546875, -24.69384765625, -23.775634765625, -22.857421875, -21.939208984375, -21.02099609375, -20.102783203125, -19.1845703125, -18.266357421875, -17.34814453125, -16.429931640625, -15.51171875, -14.593505859375, -13.67529296875, -12.757080078125, -11.8388671875, -10.920654296875, -10.00244140625, -9.084228515625, -8.166015625, -7.247802734375, -6.32958984375, -5.411376953125, -4.4931640625, -3.574951171875, -2.65673828125, -1.738525390625, -0.8203125, 0.097900390625, 1.01611328125, 1.934326171875, 2.8525390625, 3.770751953125, 4.68896484375, 5.607177734375, 6.525390625, 7.443603515625, 8.36181640625, 9.280029296875, 10.1982421875, 11.116455078125, 12.03466796875, 12.952880859375, 13.87109375, 14.789306640625, 15.70751953125, 16.625732421875, 17.5439453125, 18.462158203125, 19.38037109375, 20.298583984375, 21.216796875, 22.135009765625, 23.05322265625, 23.971435546875, 24.8896484375, 25.807861328125, 26.72607421875, 27.644287109375, 28.5625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 8.0, 26.0, 18.0, 35.0, 40.0, 60.0, 61.0, 75.0, 100.0, 91.0, 93.0, 84.0, 80.0, 62.0, 53.0, 39.0, 30.0, 16.0, 14.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.03277587890625, -3.8819580078125, -3.73114013671875, -3.580322265625, -3.42950439453125, -3.2786865234375, -3.12786865234375, -2.97705078125, -2.82623291015625, -2.6754150390625, -2.52459716796875, -2.373779296875, -2.22296142578125, -2.0721435546875, -1.92132568359375, -1.7705078125, -1.61968994140625, -1.4688720703125, -1.31805419921875, -1.167236328125, -1.01641845703125, -0.8656005859375, -0.71478271484375, -0.56396484375, -0.41314697265625, -0.2623291015625, -0.11151123046875, 0.039306640625, 0.19012451171875, 0.3409423828125, 0.49176025390625, 0.642578125, 0.79339599609375, 0.9442138671875, 1.09503173828125, 1.245849609375, 1.39666748046875, 1.5474853515625, 1.69830322265625, 1.84912109375, 1.99993896484375, 2.1507568359375, 2.30157470703125, 2.452392578125, 2.60321044921875, 2.7540283203125, 2.90484619140625, 3.0556640625, 3.20648193359375, 3.3572998046875, 3.50811767578125, 3.658935546875, 3.80975341796875, 3.9605712890625, 4.11138916015625, 4.26220703125, 4.41302490234375, 4.5638427734375, 4.71466064453125, 4.865478515625, 5.01629638671875, 5.1671142578125, 5.31793212890625, 5.46875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 3.0, 4.0, 9.0, 7.0, 14.0, 23.0, 22.0, 44.0, 53.0, 67.0, 88.0, 120.0, 190.0, 306.0, 418.0, 626.0, 1136.0, 2296.0, 6296.0, 23377.0, 108402.0, 439809.0, 358500.0, 79307.0, 17573.0, 5044.0, 1984.0, 1025.0, 561.0, 373.0, 251.0, 178.0, 116.0, 94.0, 69.0, 40.0, 37.0, 29.0, 12.0, 15.0, 7.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.75, -30.72265625, -29.6953125, -28.66796875, -27.640625, -26.61328125, -25.5859375, -24.55859375, -23.53125, -22.50390625, -21.4765625, -20.44921875, -19.421875, -18.39453125, -17.3671875, -16.33984375, -15.3125, -14.28515625, -13.2578125, -12.23046875, -11.203125, -10.17578125, -9.1484375, -8.12109375, -7.09375, -6.06640625, -5.0390625, -4.01171875, -2.984375, -1.95703125, -0.9296875, 0.09765625, 1.125, 2.15234375, 3.1796875, 4.20703125, 5.234375, 6.26171875, 7.2890625, 8.31640625, 9.34375, 10.37109375, 11.3984375, 12.42578125, 13.453125, 14.48046875, 15.5078125, 16.53515625, 17.5625, 18.58984375, 19.6171875, 20.64453125, 21.671875, 22.69921875, 23.7265625, 24.75390625, 25.78125, 26.80859375, 27.8359375, 28.86328125, 29.890625, 30.91796875, 31.9453125, 32.97265625, 34.0]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 8.0, 7.0, 12.0, 17.0, 23.0, 17.0, 33.0, 27.0, 25.0, 37.0, 34.0, 40.0, 42.0, 44.0, 49.0, 46.0, 51.0, 44.0, 50.0, 40.0, 46.0, 31.0, 39.0, 38.0, 23.0, 26.0, 17.0, 19.0, 19.0, 14.0, 8.0, 8.0, 9.0, 7.0, 10.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5234375, -14.0626220703125, -13.601806640625, -13.1409912109375, -12.68017578125, -12.2193603515625, -11.758544921875, -11.2977294921875, -10.8369140625, -10.3760986328125, -9.915283203125, -9.4544677734375, -8.99365234375, -8.5328369140625, -8.072021484375, -7.6112060546875, -7.150390625, -6.6895751953125, -6.228759765625, -5.7679443359375, -5.30712890625, -4.8463134765625, -4.385498046875, -3.9246826171875, -3.4638671875, -3.0030517578125, -2.542236328125, -2.0814208984375, -1.62060546875, -1.1597900390625, -0.698974609375, -0.2381591796875, 0.22265625, 0.6834716796875, 1.144287109375, 1.6051025390625, 2.06591796875, 2.5267333984375, 2.987548828125, 3.4483642578125, 3.9091796875, 4.3699951171875, 4.830810546875, 5.2916259765625, 5.75244140625, 6.2132568359375, 6.674072265625, 7.1348876953125, 7.595703125, 8.0565185546875, 8.517333984375, 8.9781494140625, 9.43896484375, 9.8997802734375, 10.360595703125, 10.8214111328125, 11.2822265625, 11.7430419921875, 12.203857421875, 12.6646728515625, 13.12548828125, 13.5863037109375, 14.047119140625, 14.5079345703125, 14.96875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 8.0, 16.0, 19.0, 35.0, 54.0, 74.0, 152.0, 214.0, 420.0, 741.0, 1674.0, 4044.0, 11536.0, 41975.0, 210372.0, 545070.0, 178645.0, 36264.0, 10246.0, 3722.0, 1567.0, 773.0, 353.0, 240.0, 116.0, 80.0, 39.0, 26.0, 19.0, 17.0, 7.0, 6.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.578125, -21.755615234375, -20.93310546875, -20.110595703125, -19.2880859375, -18.465576171875, -17.64306640625, -16.820556640625, -15.998046875, -15.175537109375, -14.35302734375, -13.530517578125, -12.7080078125, -11.885498046875, -11.06298828125, -10.240478515625, -9.41796875, -8.595458984375, -7.77294921875, -6.950439453125, -6.1279296875, -5.305419921875, -4.48291015625, -3.660400390625, -2.837890625, -2.015380859375, -1.19287109375, -0.370361328125, 0.4521484375, 1.274658203125, 2.09716796875, 2.919677734375, 3.7421875, 4.564697265625, 5.38720703125, 6.209716796875, 7.0322265625, 7.854736328125, 8.67724609375, 9.499755859375, 10.322265625, 11.144775390625, 11.96728515625, 12.789794921875, 13.6123046875, 14.434814453125, 15.25732421875, 16.079833984375, 16.90234375, 17.724853515625, 18.54736328125, 19.369873046875, 20.1923828125, 21.014892578125, 21.83740234375, 22.659912109375, 23.482421875, 24.304931640625, 25.12744140625, 25.949951171875, 26.7724609375, 27.594970703125, 28.41748046875, 29.239990234375, 30.0625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 12.0, 10.0, 24.0, 34.0, 40.0, 39.0, 47.0, 72.0, 74.0, 77.0, 89.0, 75.0, 69.0, 65.0, 62.0, 42.0, 41.0, 21.0, 20.0, 15.0, 16.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017547607421875, -0.0016904175281524658, -0.0016260743141174316, -0.0015617311000823975, -0.0014973878860473633, -0.001433044672012329, -0.001368701457977295, -0.0013043582439422607, -0.0012400150299072266, -0.0011756718158721924, -0.0011113286018371582, -0.001046985387802124, -0.0009826421737670898, -0.0009182989597320557, -0.0008539557456970215, -0.0007896125316619873, -0.0007252693176269531, -0.0006609261035919189, -0.0005965828895568848, -0.0005322396755218506, -0.0004678964614868164, -0.0004035532474517822, -0.00033921003341674805, -0.00027486681938171387, -0.0002105236053466797, -0.0001461803913116455, -8.183717727661133e-05, -1.749396324157715e-05, 4.684925079345703e-05, 0.00011119246482849121, 0.0001755356788635254, 0.00023987889289855957, 0.00030422210693359375, 0.00036856532096862793, 0.0004329085350036621, 0.0004972517490386963, 0.0005615949630737305, 0.0006259381771087646, 0.0006902813911437988, 0.000754624605178833, 0.0008189678192138672, 0.0008833110332489014, 0.0009476542472839355, 0.0010119974613189697, 0.001076340675354004, 0.001140683889389038, 0.0012050271034240723, 0.0012693703174591064, 0.0013337135314941406, 0.0013980567455291748, 0.001462399959564209, 0.0015267431735992432, 0.0015910863876342773, 0.0016554296016693115, 0.0017197728157043457, 0.0017841160297393799, 0.001848459243774414, 0.0019128024578094482, 0.0019771456718444824, 0.0020414888858795166, 0.0021058320999145508, 0.002170175313949585, 0.002234518527984619, 0.0022988617420196533, 0.0023632049560546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 2.0, 6.0, 9.0, 14.0, 18.0, 34.0, 46.0, 71.0, 132.0, 232.0, 393.0, 780.0, 1727.0, 4260.0, 16191.0, 121039.0, 637198.0, 229432.0, 26747.0, 5893.0, 2169.0, 948.0, 506.0, 296.0, 138.0, 104.0, 64.0, 26.0, 17.0, 15.0, 4.0, 8.0, 5.0, 10.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.59375, -44.382568359375, -43.17138671875, -41.960205078125, -40.7490234375, -39.537841796875, -38.32666015625, -37.115478515625, -35.904296875, -34.693115234375, -33.48193359375, -32.270751953125, -31.0595703125, -29.848388671875, -28.63720703125, -27.426025390625, -26.21484375, -25.003662109375, -23.79248046875, -22.581298828125, -21.3701171875, -20.158935546875, -18.94775390625, -17.736572265625, -16.525390625, -15.314208984375, -14.10302734375, -12.891845703125, -11.6806640625, -10.469482421875, -9.25830078125, -8.047119140625, -6.8359375, -5.624755859375, -4.41357421875, -3.202392578125, -1.9912109375, -0.780029296875, 0.43115234375, 1.642333984375, 2.853515625, 4.064697265625, 5.27587890625, 6.487060546875, 7.6982421875, 8.909423828125, 10.12060546875, 11.331787109375, 12.54296875, 13.754150390625, 14.96533203125, 16.176513671875, 17.3876953125, 18.598876953125, 19.81005859375, 21.021240234375, 22.232421875, 23.443603515625, 24.65478515625, 25.865966796875, 27.0771484375, 28.288330078125, 29.49951171875, 30.710693359375, 31.921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 12.0, 10.0, 23.0, 34.0, 51.0, 66.0, 78.0, 79.0, 88.0, 95.0, 95.0, 76.0, 68.0, 58.0, 46.0, 33.0, 19.0, 19.0, 13.0, 7.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.4141845703125, -13.804931640625, -13.1956787109375, -12.58642578125, -11.9771728515625, -11.367919921875, -10.7586669921875, -10.1494140625, -9.5401611328125, -8.930908203125, -8.3216552734375, -7.71240234375, -7.1031494140625, -6.493896484375, -5.8846435546875, -5.275390625, -4.6661376953125, -4.056884765625, -3.4476318359375, -2.83837890625, -2.2291259765625, -1.619873046875, -1.0106201171875, -0.4013671875, 0.2078857421875, 0.817138671875, 1.4263916015625, 2.03564453125, 2.6448974609375, 3.254150390625, 3.8634033203125, 4.47265625, 5.0819091796875, 5.691162109375, 6.3004150390625, 6.90966796875, 7.5189208984375, 8.128173828125, 8.7374267578125, 9.3466796875, 9.9559326171875, 10.565185546875, 11.1744384765625, 11.78369140625, 12.3929443359375, 13.002197265625, 13.6114501953125, 14.220703125, 14.8299560546875, 15.439208984375, 16.0484619140625, 16.65771484375, 17.2669677734375, 17.876220703125, 18.4854736328125, 19.0947265625, 19.7039794921875, 20.313232421875, 20.9224853515625, 21.53173828125, 22.1409912109375, 22.750244140625, 23.3594970703125, 23.96875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 11.0, 34.0, 112.0, 229.0, 309.0, 192.0, 83.0, 20.0, 8.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-598.8878173828125, -586.2535400390625, -573.6192626953125, -560.9849853515625, -548.3506469726562, -535.7163696289062, -523.0820922851562, -510.44781494140625, -497.81353759765625, -485.17926025390625, -472.5449523925781, -459.9106750488281, -447.2763977050781, -434.6421203613281, -422.0078125, -409.37353515625, -396.7392578125, -384.10498046875, -371.4706726074219, -358.8363952636719, -346.2021179199219, -333.5678405761719, -320.93353271484375, -308.29925537109375, -295.6649475097656, -283.0306701660156, -270.3963623046875, -257.7620849609375, -245.1278076171875, -232.49351501464844, -219.85922241210938, -207.22494506835938, -194.59066772460938, -181.9563751220703, -169.3220977783203, -156.68780517578125, -144.05352783203125, -131.4192352294922, -118.78495025634766, -106.15066528320312, -93.5163803100586, -80.88209533691406, -68.24781036376953, -55.613521575927734, -42.9792366027832, -30.344951629638672, -17.710662841796875, -5.076377868652344, 7.5579071044921875, 20.19219207763672, 32.82647705078125, 45.46076583862305, 58.09505081176758, 70.72933959960938, 83.3636245727539, 95.99790954589844, 108.63219451904297, 121.2664794921875, 133.90077209472656, 146.53504943847656, 159.16934204101562, 171.80361938476562, 184.4379119873047, 197.07220458984375, 209.70648193359375]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 11.0, 12.0, 19.0, 19.0, 27.0, 39.0, 40.0, 33.0, 51.0, 47.0, 49.0, 41.0, 49.0, 62.0, 44.0, 41.0, 57.0, 49.0, 47.0, 44.0, 37.0, 30.0, 37.0, 16.0, 20.0, 9.0, 14.0, 8.0, 9.0, 9.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.0939483642578, -127.42398071289062, -123.75401306152344, -120.08403778076172, -116.41407012939453, -112.74410247802734, -109.07412719726562, -105.40415954589844, -101.73419189453125, -98.06422424316406, -94.39425659179688, -90.72428131103516, -87.05431365966797, -83.38434600830078, -79.71437072753906, -76.04440307617188, -72.37443542480469, -68.7044677734375, -65.03450012207031, -61.364524841308594, -57.694557189941406, -54.02458953857422, -50.354618072509766, -46.68464660644531, -43.014678955078125, -39.34471130371094, -35.674739837646484, -32.00476837158203, -28.334800720214844, -24.664831161499023, -20.994861602783203, -17.324892044067383, -13.654922485351562, -9.984952926635742, -6.314983367919922, -2.6450138092041016, 1.0249557495117188, 4.694925308227539, 8.36489486694336, 12.03486442565918, 15.704833984375, 19.37480354309082, 23.04477310180664, 26.71474266052246, 30.38471221923828, 34.05467987060547, 37.72465133666992, 41.394622802734375, 45.06459045410156, 48.73455810546875, 52.4045295715332, 56.074501037597656, 59.744468688964844, 63.41443634033203, 67.08441162109375, 70.75437927246094, 74.42434692382812, 78.09431457519531, 81.7642822265625, 85.43425750732422, 89.1042251586914, 92.7741928100586, 96.44416809082031, 100.1141357421875, 103.78410339355469]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 7.0, 6.0, 3.0, 7.0, 12.0, 11.0, 18.0, 28.0, 37.0, 36.0, 52.0, 89.0, 139.0, 272.0, 449.0, 924.0, 1971.0, 4639.0, 13197.0, 45641.0, 272647.0, 3532624.0, 255167.0, 44081.0, 13010.0, 4775.0, 2015.0, 1013.0, 478.0, 274.0, 211.0, 119.0, 81.0, 55.0, 48.0, 30.0, 23.0, 23.0, 19.0, 9.0, 11.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-37.78125, -36.455078125, -35.12890625, -33.802734375, -32.4765625, -31.150390625, -29.82421875, -28.498046875, -27.171875, -25.845703125, -24.51953125, -23.193359375, -21.8671875, -20.541015625, -19.21484375, -17.888671875, -16.5625, -15.236328125, -13.91015625, -12.583984375, -11.2578125, -9.931640625, -8.60546875, -7.279296875, -5.953125, -4.626953125, -3.30078125, -1.974609375, -0.6484375, 0.677734375, 2.00390625, 3.330078125, 4.65625, 5.982421875, 7.30859375, 8.634765625, 9.9609375, 11.287109375, 12.61328125, 13.939453125, 15.265625, 16.591796875, 17.91796875, 19.244140625, 20.5703125, 21.896484375, 23.22265625, 24.548828125, 25.875, 27.201171875, 28.52734375, 29.853515625, 31.1796875, 32.505859375, 33.83203125, 35.158203125, 36.484375, 37.810546875, 39.13671875, 40.462890625, 41.7890625, 43.115234375, 44.44140625, 45.767578125, 47.09375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 4.0, 7.0, 15.0, 19.0, 24.0, 34.0, 23.0, 32.0, 54.0, 50.0, 64.0, 79.0, 78.0, 68.0, 57.0, 48.0, 51.0, 68.0, 50.0, 44.0, 20.0, 24.0, 32.0, 14.0, 15.0, 11.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.595703125, -3.469329833984375, -3.34295654296875, -3.216583251953125, -3.0902099609375, -2.963836669921875, -2.83746337890625, -2.711090087890625, -2.584716796875, -2.458343505859375, -2.33197021484375, -2.205596923828125, -2.0792236328125, -1.952850341796875, -1.82647705078125, -1.700103759765625, -1.57373046875, -1.447357177734375, -1.32098388671875, -1.194610595703125, -1.0682373046875, -0.941864013671875, -0.81549072265625, -0.689117431640625, -0.562744140625, -0.436370849609375, -0.30999755859375, -0.183624267578125, -0.0572509765625, 0.069122314453125, 0.19549560546875, 0.321868896484375, 0.4482421875, 0.574615478515625, 0.70098876953125, 0.827362060546875, 0.9537353515625, 1.080108642578125, 1.20648193359375, 1.332855224609375, 1.459228515625, 1.585601806640625, 1.71197509765625, 1.838348388671875, 1.9647216796875, 2.091094970703125, 2.21746826171875, 2.343841552734375, 2.47021484375, 2.596588134765625, 2.72296142578125, 2.849334716796875, 2.9757080078125, 3.102081298828125, 3.22845458984375, 3.354827880859375, 3.481201171875, 3.607574462890625, 3.73394775390625, 3.860321044921875, 3.9866943359375, 4.113067626953125, 4.23944091796875, 4.365814208984375, 4.4921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 6.0, 10.0, 9.0, 10.0, 11.0, 21.0, 16.0, 29.0, 21.0, 34.0, 44.0, 61.0, 107.0, 238.0, 588.0, 1898.0, 11325.0, 149555.0, 3819637.0, 194009.0, 13147.0, 2219.0, 590.0, 202.0, 117.0, 74.0, 58.0, 47.0, 23.0, 26.0, 20.0, 20.0, 19.0, 15.0, 10.0, 12.0, 11.0, 14.0, 3.0, 1.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.8125, -69.4609375, -67.109375, -64.7578125, -62.40625, -60.0546875, -57.703125, -55.3515625, -53.0, -50.6484375, -48.296875, -45.9453125, -43.59375, -41.2421875, -38.890625, -36.5390625, -34.1875, -31.8359375, -29.484375, -27.1328125, -24.78125, -22.4296875, -20.078125, -17.7265625, -15.375, -13.0234375, -10.671875, -8.3203125, -5.96875, -3.6171875, -1.265625, 1.0859375, 3.4375, 5.7890625, 8.140625, 10.4921875, 12.84375, 15.1953125, 17.546875, 19.8984375, 22.25, 24.6015625, 26.953125, 29.3046875, 31.65625, 34.0078125, 36.359375, 38.7109375, 41.0625, 43.4140625, 45.765625, 48.1171875, 50.46875, 52.8203125, 55.171875, 57.5234375, 59.875, 62.2265625, 64.578125, 66.9296875, 69.28125, 71.6328125, 73.984375, 76.3359375, 78.6875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 15.0, 28.0, 55.0, 155.0, 496.0, 2310.0, 697.0, 186.0, 75.0, 27.0, 16.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.0706787109375, -8.352294921875, -7.6339111328125, -6.91552734375, -6.1971435546875, -5.478759765625, -4.7603759765625, -4.0419921875, -3.3236083984375, -2.605224609375, -1.8868408203125, -1.16845703125, -0.4500732421875, 0.268310546875, 0.9866943359375, 1.705078125, 2.4234619140625, 3.141845703125, 3.8602294921875, 4.57861328125, 5.2969970703125, 6.015380859375, 6.7337646484375, 7.4521484375, 8.1705322265625, 8.888916015625, 9.6072998046875, 10.32568359375, 11.0440673828125, 11.762451171875, 12.4808349609375, 13.19921875, 13.9176025390625, 14.635986328125, 15.3543701171875, 16.07275390625, 16.7911376953125, 17.509521484375, 18.2279052734375, 18.9462890625, 19.6646728515625, 20.383056640625, 21.1014404296875, 21.81982421875, 22.5382080078125, 23.256591796875, 23.9749755859375, 24.693359375, 25.4117431640625, 26.130126953125, 26.8485107421875, 27.56689453125, 28.2852783203125, 29.003662109375, 29.7220458984375, 30.4404296875, 31.1588134765625, 31.877197265625, 32.5955810546875, 33.31396484375, 34.0323486328125, 34.750732421875, 35.4691162109375, 36.1875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 13.0, 15.0, 19.0, 36.0, 72.0, 115.0, 165.0, 184.0, 123.0, 105.0, 76.0, 27.0, 23.0, 12.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.16114807128906, -78.63786315917969, -76.11457824707031, -73.59130096435547, -71.0680160522461, -68.54473114013672, -66.02144622802734, -63.49816131591797, -60.97488021850586, -58.451595306396484, -55.928314208984375, -53.405029296875, -50.881744384765625, -48.358463287353516, -45.83517837524414, -43.31189727783203, -40.788612365722656, -38.26532745361328, -35.74204635620117, -33.2187614440918, -30.695478439331055, -28.172195434570312, -25.648910522460938, -23.125627517700195, -20.602344512939453, -18.07906150817871, -15.555777549743652, -13.032493591308594, -10.509210586547852, -7.985927581787109, -5.462643623352051, -2.939359664916992, -0.41606903076171875, 2.1072144508361816, 4.630497932434082, 7.153781414031982, 9.677064895629883, 12.200347900390625, 14.723631858825684, 17.246915817260742, 19.770198822021484, 22.293481826782227, 24.81676483154297, 27.340049743652344, 29.863332748413086, 32.38661575317383, 34.9099006652832, 37.43318176269531, 39.95646667480469, 42.47975158691406, 45.00303268432617, 47.52631759643555, 50.049598693847656, 52.57288360595703, 55.096168518066406, 57.61945343017578, 60.14273452758789, 62.666019439697266, 65.18930053710938, 67.71258544921875, 70.23587036132812, 72.7591552734375, 75.28243255615234, 77.80571746826172, 80.3290023803711]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 11.0, 10.0, 7.0, 19.0, 28.0, 18.0, 35.0, 44.0, 47.0, 55.0, 63.0, 74.0, 61.0, 69.0, 61.0, 60.0, 51.0, 51.0, 53.0, 37.0, 37.0, 25.0, 18.0, 13.0, 18.0, 11.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-57.13761901855469, -55.70052719116211, -54.26343536376953, -52.82634353637695, -51.389251708984375, -49.9521598815918, -48.51506805419922, -47.07797622680664, -45.64088439941406, -44.203792572021484, -42.766700744628906, -41.32960891723633, -39.89251708984375, -38.45542526245117, -37.018333435058594, -35.581241607666016, -34.14414978027344, -32.70705795288086, -31.26996612548828, -29.832874298095703, -28.395782470703125, -26.958690643310547, -25.52159881591797, -24.08450698852539, -22.647415161132812, -21.210323333740234, -19.773231506347656, -18.336139678955078, -16.8990478515625, -15.461956024169922, -14.024864196777344, -12.587772369384766, -11.150680541992188, -9.71358871459961, -8.276496887207031, -6.839405059814453, -5.402313232421875, -3.965221405029297, -2.5281295776367188, -1.0910377502441406, 0.3460540771484375, 1.7831459045410156, 3.2202377319335938, 4.657329559326172, 6.09442138671875, 7.531513214111328, 8.968605041503906, 10.405696868896484, 11.842788696289062, 13.27988052368164, 14.716972351074219, 16.154064178466797, 17.591156005859375, 19.028247833251953, 20.46533966064453, 21.90243148803711, 23.339523315429688, 24.776615142822266, 26.213706970214844, 27.650798797607422, 29.087890625, 30.524982452392578, 31.962074279785156, 33.399166107177734, 34.83625793457031]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 5.0, 11.0, 12.0, 15.0, 33.0, 32.0, 64.0, 78.0, 139.0, 226.0, 408.0, 813.0, 1567.0, 3395.0, 7340.0, 18487.0, 47728.0, 120080.0, 252779.0, 306068.0, 170344.0, 71385.0, 27563.0, 10951.0, 4665.0, 2077.0, 1055.0, 524.0, 269.0, 157.0, 104.0, 55.0, 37.0, 20.0, 14.0, 14.0, 10.0, 7.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-20.71875, -20.1466064453125, -19.574462890625, -19.0023193359375, -18.43017578125, -17.8580322265625, -17.285888671875, -16.7137451171875, -16.1416015625, -15.5694580078125, -14.997314453125, -14.4251708984375, -13.85302734375, -13.2808837890625, -12.708740234375, -12.1365966796875, -11.564453125, -10.9923095703125, -10.420166015625, -9.8480224609375, -9.27587890625, -8.7037353515625, -8.131591796875, -7.5594482421875, -6.9873046875, -6.4151611328125, -5.843017578125, -5.2708740234375, -4.69873046875, -4.1265869140625, -3.554443359375, -2.9822998046875, -2.41015625, -1.8380126953125, -1.265869140625, -0.6937255859375, -0.12158203125, 0.4505615234375, 1.022705078125, 1.5948486328125, 2.1669921875, 2.7391357421875, 3.311279296875, 3.8834228515625, 4.45556640625, 5.0277099609375, 5.599853515625, 6.1719970703125, 6.744140625, 7.3162841796875, 7.888427734375, 8.4605712890625, 9.03271484375, 9.6048583984375, 10.177001953125, 10.7491455078125, 11.3212890625, 11.8934326171875, 12.465576171875, 13.0377197265625, 13.60986328125, 14.1820068359375, 14.754150390625, 15.3262939453125, 15.8984375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 0.0, 3.0, 9.0, 9.0, 12.0, 9.0, 19.0, 19.0, 17.0, 27.0, 22.0, 24.0, 30.0, 32.0, 38.0, 38.0, 53.0, 56.0, 46.0, 45.0, 42.0, 32.0, 42.0, 33.0, 42.0, 36.0, 42.0, 28.0, 38.0, 29.0, 23.0, 9.0, 20.0, 13.0, 18.0, 13.0, 5.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.2625732421875, -2.179443359375, -2.0963134765625, -2.01318359375, -1.9300537109375, -1.846923828125, -1.7637939453125, -1.6806640625, -1.5975341796875, -1.514404296875, -1.4312744140625, -1.34814453125, -1.2650146484375, -1.181884765625, -1.0987548828125, -1.015625, -0.9324951171875, -0.849365234375, -0.7662353515625, -0.68310546875, -0.5999755859375, -0.516845703125, -0.4337158203125, -0.3505859375, -0.2674560546875, -0.184326171875, -0.1011962890625, -0.01806640625, 0.0650634765625, 0.148193359375, 0.2313232421875, 0.314453125, 0.3975830078125, 0.480712890625, 0.5638427734375, 0.64697265625, 0.7301025390625, 0.813232421875, 0.8963623046875, 0.9794921875, 1.0626220703125, 1.145751953125, 1.2288818359375, 1.31201171875, 1.3951416015625, 1.478271484375, 1.5614013671875, 1.64453125, 1.7276611328125, 1.810791015625, 1.8939208984375, 1.97705078125, 2.0601806640625, 2.143310546875, 2.2264404296875, 2.3095703125, 2.3927001953125, 2.475830078125, 2.5589599609375, 2.64208984375, 2.7252197265625, 2.808349609375, 2.8914794921875, 2.974609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 11.0, 9.0, 8.0, 19.0, 27.0, 31.0, 44.0, 69.0, 75.0, 136.0, 172.0, 193.0, 304.0, 455.0, 631.0, 1106.0, 2261.0, 5325.0, 16657.0, 58467.0, 196333.0, 409294.0, 246134.0, 76359.0, 21660.0, 6691.0, 2625.0, 1192.0, 696.0, 453.0, 299.0, 231.0, 169.0, 119.0, 84.0, 69.0, 41.0, 32.0, 21.0, 17.0, 15.0, 5.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.703125, -19.059326171875, -18.41552734375, -17.771728515625, -17.1279296875, -16.484130859375, -15.84033203125, -15.196533203125, -14.552734375, -13.908935546875, -13.26513671875, -12.621337890625, -11.9775390625, -11.333740234375, -10.68994140625, -10.046142578125, -9.40234375, -8.758544921875, -8.11474609375, -7.470947265625, -6.8271484375, -6.183349609375, -5.53955078125, -4.895751953125, -4.251953125, -3.608154296875, -2.96435546875, -2.320556640625, -1.6767578125, -1.032958984375, -0.38916015625, 0.254638671875, 0.8984375, 1.542236328125, 2.18603515625, 2.829833984375, 3.4736328125, 4.117431640625, 4.76123046875, 5.405029296875, 6.048828125, 6.692626953125, 7.33642578125, 7.980224609375, 8.6240234375, 9.267822265625, 9.91162109375, 10.555419921875, 11.19921875, 11.843017578125, 12.48681640625, 13.130615234375, 13.7744140625, 14.418212890625, 15.06201171875, 15.705810546875, 16.349609375, 16.993408203125, 17.63720703125, 18.281005859375, 18.9248046875, 19.568603515625, 20.21240234375, 20.856201171875, 21.5]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 11.0, 8.0, 11.0, 13.0, 19.0, 29.0, 19.0, 18.0, 42.0, 40.0, 28.0, 45.0, 40.0, 40.0, 40.0, 42.0, 46.0, 41.0, 55.0, 51.0, 50.0, 39.0, 32.0, 28.0, 27.0, 27.0, 18.0, 23.0, 16.0, 18.0, 14.0, 8.0, 6.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5, -12.0701904296875, -11.640380859375, -11.2105712890625, -10.78076171875, -10.3509521484375, -9.921142578125, -9.4913330078125, -9.0615234375, -8.6317138671875, -8.201904296875, -7.7720947265625, -7.34228515625, -6.9124755859375, -6.482666015625, -6.0528564453125, -5.623046875, -5.1932373046875, -4.763427734375, -4.3336181640625, -3.90380859375, -3.4739990234375, -3.044189453125, -2.6143798828125, -2.1845703125, -1.7547607421875, -1.324951171875, -0.8951416015625, -0.46533203125, -0.0355224609375, 0.394287109375, 0.8240966796875, 1.25390625, 1.6837158203125, 2.113525390625, 2.5433349609375, 2.97314453125, 3.4029541015625, 3.832763671875, 4.2625732421875, 4.6923828125, 5.1221923828125, 5.552001953125, 5.9818115234375, 6.41162109375, 6.8414306640625, 7.271240234375, 7.7010498046875, 8.130859375, 8.5606689453125, 8.990478515625, 9.4202880859375, 9.85009765625, 10.2799072265625, 10.709716796875, 11.1395263671875, 11.5693359375, 11.9991455078125, 12.428955078125, 12.8587646484375, 13.28857421875, 13.7183837890625, 14.148193359375, 14.5780029296875, 15.0078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 7.0, 7.0, 12.0, 11.0, 25.0, 37.0, 73.0, 93.0, 159.0, 329.0, 593.0, 1502.0, 4325.0, 17947.0, 172213.0, 725797.0, 106006.0, 13367.0, 3493.0, 1255.0, 577.0, 313.0, 173.0, 97.0, 58.0, 36.0, 19.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.4375, -21.618896484375, -20.80029296875, -19.981689453125, -19.1630859375, -18.344482421875, -17.52587890625, -16.707275390625, -15.888671875, -15.070068359375, -14.25146484375, -13.432861328125, -12.6142578125, -11.795654296875, -10.97705078125, -10.158447265625, -9.33984375, -8.521240234375, -7.70263671875, -6.884033203125, -6.0654296875, -5.246826171875, -4.42822265625, -3.609619140625, -2.791015625, -1.972412109375, -1.15380859375, -0.335205078125, 0.4833984375, 1.302001953125, 2.12060546875, 2.939208984375, 3.7578125, 4.576416015625, 5.39501953125, 6.213623046875, 7.0322265625, 7.850830078125, 8.66943359375, 9.488037109375, 10.306640625, 11.125244140625, 11.94384765625, 12.762451171875, 13.5810546875, 14.399658203125, 15.21826171875, 16.036865234375, 16.85546875, 17.674072265625, 18.49267578125, 19.311279296875, 20.1298828125, 20.948486328125, 21.76708984375, 22.585693359375, 23.404296875, 24.222900390625, 25.04150390625, 25.860107421875, 26.6787109375, 27.497314453125, 28.31591796875, 29.134521484375, 29.953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 9.0, 17.0, 17.0, 29.0, 25.0, 33.0, 42.0, 43.0, 84.0, 85.0, 95.0, 114.0, 82.0, 61.0, 46.0, 48.0, 32.0, 20.0, 25.0, 19.0, 11.0, 5.0, 1.0, 11.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014190673828125, -0.0013680458068847656, -0.0013170242309570312, -0.0012660026550292969, -0.0012149810791015625, -0.0011639595031738281, -0.0011129379272460938, -0.0010619163513183594, -0.001010894775390625, -0.0009598731994628906, -0.0009088516235351562, -0.0008578300476074219, -0.0008068084716796875, -0.0007557868957519531, -0.0007047653198242188, -0.0006537437438964844, -0.00060272216796875, -0.0005517005920410156, -0.0005006790161132812, -0.0004496574401855469, -0.0003986358642578125, -0.0003476142883300781, -0.00029659271240234375, -0.0002455711364746094, -0.000194549560546875, -0.00014352798461914062, -9.250640869140625e-05, -4.1484832763671875e-05, 9.5367431640625e-06, 6.0558319091796875e-05, 0.00011157989501953125, 0.00016260147094726562, 0.000213623046875, 0.0002646446228027344, 0.00031566619873046875, 0.0003666877746582031, 0.0004177093505859375, 0.0004687309265136719, 0.0005197525024414062, 0.0005707740783691406, 0.000621795654296875, 0.0006728172302246094, 0.0007238388061523438, 0.0007748603820800781, 0.0008258819580078125, 0.0008769035339355469, 0.0009279251098632812, 0.0009789466857910156, 0.00102996826171875, 0.0010809898376464844, 0.0011320114135742188, 0.0011830329895019531, 0.0012340545654296875, 0.0012850761413574219, 0.0013360977172851562, 0.0013871192932128906, 0.001438140869140625, 0.0014891624450683594, 0.0015401840209960938, 0.0015912055969238281, 0.0016422271728515625, 0.0016932487487792969, 0.0017442703247070312, 0.0017952919006347656, 0.0018463134765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 5.0, 8.0, 6.0, 5.0, 16.0, 22.0, 32.0, 58.0, 103.0, 184.0, 378.0, 855.0, 2815.0, 14848.0, 222504.0, 751103.0, 46721.0, 6180.0, 1504.0, 600.0, 275.0, 125.0, 74.0, 52.0, 29.0, 16.0, 9.0, 8.0, 2.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-48.40625, -47.260498046875, -46.11474609375, -44.968994140625, -43.8232421875, -42.677490234375, -41.53173828125, -40.385986328125, -39.240234375, -38.094482421875, -36.94873046875, -35.802978515625, -34.6572265625, -33.511474609375, -32.36572265625, -31.219970703125, -30.07421875, -28.928466796875, -27.78271484375, -26.636962890625, -25.4912109375, -24.345458984375, -23.19970703125, -22.053955078125, -20.908203125, -19.762451171875, -18.61669921875, -17.470947265625, -16.3251953125, -15.179443359375, -14.03369140625, -12.887939453125, -11.7421875, -10.596435546875, -9.45068359375, -8.304931640625, -7.1591796875, -6.013427734375, -4.86767578125, -3.721923828125, -2.576171875, -1.430419921875, -0.28466796875, 0.861083984375, 2.0068359375, 3.152587890625, 4.29833984375, 5.444091796875, 6.58984375, 7.735595703125, 8.88134765625, 10.027099609375, 11.1728515625, 12.318603515625, 13.46435546875, 14.610107421875, 15.755859375, 16.901611328125, 18.04736328125, 19.193115234375, 20.3388671875, 21.484619140625, 22.63037109375, 23.776123046875, 24.921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 12.0, 11.0, 11.0, 12.0, 33.0, 43.0, 61.0, 75.0, 81.0, 113.0, 101.0, 105.0, 91.0, 62.0, 53.0, 37.0, 20.0, 18.0, 17.0, 15.0, 5.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.874267578125, -8.43603515625, -7.997802734375, -7.5595703125, -7.121337890625, -6.68310546875, -6.244873046875, -5.806640625, -5.368408203125, -4.93017578125, -4.491943359375, -4.0537109375, -3.615478515625, -3.17724609375, -2.739013671875, -2.30078125, -1.862548828125, -1.42431640625, -0.986083984375, -0.5478515625, -0.109619140625, 0.32861328125, 0.766845703125, 1.205078125, 1.643310546875, 2.08154296875, 2.519775390625, 2.9580078125, 3.396240234375, 3.83447265625, 4.272705078125, 4.7109375, 5.149169921875, 5.58740234375, 6.025634765625, 6.4638671875, 6.902099609375, 7.34033203125, 7.778564453125, 8.216796875, 8.655029296875, 9.09326171875, 9.531494140625, 9.9697265625, 10.407958984375, 10.84619140625, 11.284423828125, 11.72265625, 12.160888671875, 12.59912109375, 13.037353515625, 13.4755859375, 13.913818359375, 14.35205078125, 14.790283203125, 15.228515625, 15.666748046875, 16.10498046875, 16.543212890625, 16.9814453125, 17.419677734375, 17.85791015625, 18.296142578125, 18.734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 11.0, 22.0, 32.0, 64.0, 99.0, 142.0, 158.0, 159.0, 120.0, 84.0, 47.0, 30.0, 17.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.94647216796875, -160.3875274658203, -154.82859802246094, -149.2696533203125, -143.71072387695312, -138.1517791748047, -132.59283447265625, -127.03389739990234, -121.47496032714844, -115.91602325439453, -110.35708618164062, -104.79814147949219, -99.23920440673828, -93.68026733398438, -88.12132263183594, -82.56238555908203, -77.00344848632812, -71.44451141357422, -65.88557434082031, -60.326629638671875, -54.76769256591797, -49.20875549316406, -43.64981460571289, -38.09087371826172, -32.53193664550781, -26.972997665405273, -21.414058685302734, -15.855119705200195, -10.296180725097656, -4.737241744995117, 0.8216972351074219, 6.380638122558594, 11.9395751953125, 17.49851417541504, 23.057453155517578, 28.616392135620117, 34.175331115722656, 39.73426818847656, 45.293209075927734, 50.852149963378906, 56.41108703613281, 61.97002410888672, 67.52896118164062, 73.08790588378906, 78.64684295654297, 84.20578002929688, 89.76472473144531, 95.32366180419922, 100.88259887695312, 106.44153594970703, 112.00047302246094, 117.55941772460938, 123.11835479736328, 128.6772918701172, 134.23623657226562, 139.795166015625, 145.35411071777344, 150.91305541992188, 156.47198486328125, 162.0309295654297, 167.58987426757812, 173.1488037109375, 178.70774841308594, 184.26669311523438, 189.82562255859375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 7.0, 4.0, 9.0, 9.0, 11.0, 17.0, 18.0, 27.0, 35.0, 30.0, 27.0, 45.0, 38.0, 41.0, 34.0, 38.0, 52.0, 44.0, 41.0, 53.0, 51.0, 40.0, 40.0, 38.0, 45.0, 22.0, 20.0, 28.0, 31.0, 17.0, 14.0, 11.0, 13.0, 5.0, 7.0, 4.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.92521667480469, -88.2435302734375, -85.56185150146484, -82.88017272949219, -80.198486328125, -77.51679992675781, -74.83512115478516, -72.1534423828125, -69.47175598144531, -66.79006958007812, -64.10839080810547, -61.42670822143555, -58.745025634765625, -56.0633430480957, -53.38166046142578, -50.69997787475586, -48.01829528808594, -45.336612701416016, -42.654930114746094, -39.97324752807617, -37.29156494140625, -34.60988235473633, -31.928199768066406, -29.246517181396484, -26.564834594726562, -23.88315200805664, -21.20146942138672, -18.519786834716797, -15.838104248046875, -13.156421661376953, -10.474739074707031, -7.793056488037109, -5.111366271972656, -2.4296836853027344, 0.2519989013671875, 2.9336814880371094, 5.615364074707031, 8.297046661376953, 10.978729248046875, 13.660411834716797, 16.34209442138672, 19.02377700805664, 21.705459594726562, 24.387142181396484, 27.068824768066406, 29.750507354736328, 32.43218994140625, 35.11387252807617, 37.795555114746094, 40.477237701416016, 43.15892028808594, 45.84060287475586, 48.52228546142578, 51.2039680480957, 53.885650634765625, 56.56733322143555, 59.24901580810547, 61.93069839477539, 64.61238098144531, 67.2940673828125, 69.97574615478516, 72.65742492675781, 75.339111328125, 78.02079772949219, 80.70247650146484]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 10.0, 15.0, 20.0, 32.0, 67.0, 103.0, 200.0, 504.0, 1018.0, 2261.0, 5891.0, 17608.0, 70589.0, 730587.0, 3214596.0, 111527.0, 25110.0, 8064.0, 3359.0, 1385.0, 665.0, 330.0, 159.0, 77.0, 44.0, 22.0, 15.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.03125, -38.033935546875, -37.03662109375, -36.039306640625, -35.0419921875, -34.044677734375, -33.04736328125, -32.050048828125, -31.052734375, -30.055419921875, -29.05810546875, -28.060791015625, -27.0634765625, -26.066162109375, -25.06884765625, -24.071533203125, -23.07421875, -22.076904296875, -21.07958984375, -20.082275390625, -19.0849609375, -18.087646484375, -17.09033203125, -16.093017578125, -15.095703125, -14.098388671875, -13.10107421875, -12.103759765625, -11.1064453125, -10.109130859375, -9.11181640625, -8.114501953125, -7.1171875, -6.119873046875, -5.12255859375, -4.125244140625, -3.1279296875, -2.130615234375, -1.13330078125, -0.135986328125, 0.861328125, 1.858642578125, 2.85595703125, 3.853271484375, 4.8505859375, 5.847900390625, 6.84521484375, 7.842529296875, 8.83984375, 9.837158203125, 10.83447265625, 11.831787109375, 12.8291015625, 13.826416015625, 14.82373046875, 15.821044921875, 16.818359375, 17.815673828125, 18.81298828125, 19.810302734375, 20.8076171875, 21.804931640625, 22.80224609375, 23.799560546875, 24.796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 4.0, 15.0, 16.0, 25.0, 31.0, 28.0, 36.0, 31.0, 44.0, 51.0, 46.0, 60.0, 42.0, 47.0, 48.0, 58.0, 55.0, 46.0, 42.0, 35.0, 43.0, 26.0, 26.0, 27.0, 20.0, 13.0, 9.0, 10.0, 13.0, 4.0, 8.0, 8.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.177734375, -3.081695556640625, -2.98565673828125, -2.889617919921875, -2.7935791015625, -2.697540283203125, -2.60150146484375, -2.505462646484375, -2.409423828125, -2.313385009765625, -2.21734619140625, -2.121307373046875, -2.0252685546875, -1.929229736328125, -1.83319091796875, -1.737152099609375, -1.64111328125, -1.545074462890625, -1.44903564453125, -1.352996826171875, -1.2569580078125, -1.160919189453125, -1.06488037109375, -0.968841552734375, -0.872802734375, -0.776763916015625, -0.68072509765625, -0.584686279296875, -0.4886474609375, -0.392608642578125, -0.29656982421875, -0.200531005859375, -0.1044921875, -0.008453369140625, 0.08758544921875, 0.183624267578125, 0.2796630859375, 0.375701904296875, 0.47174072265625, 0.567779541015625, 0.663818359375, 0.759857177734375, 0.85589599609375, 0.951934814453125, 1.0479736328125, 1.144012451171875, 1.24005126953125, 1.336090087890625, 1.43212890625, 1.528167724609375, 1.62420654296875, 1.720245361328125, 1.8162841796875, 1.912322998046875, 2.00836181640625, 2.104400634765625, 2.200439453125, 2.296478271484375, 2.39251708984375, 2.488555908203125, 2.5845947265625, 2.680633544921875, 2.77667236328125, 2.872711181640625, 2.96875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 10.0, 8.0, 12.0, 15.0, 15.0, 26.0, 33.0, 55.0, 86.0, 132.0, 215.0, 365.0, 592.0, 1204.0, 2277.0, 4653.0, 10766.0, 27214.0, 77887.0, 277390.0, 2438005.0, 1068519.0, 190012.0, 57828.0, 20613.0, 8569.0, 3807.0, 1781.0, 940.0, 501.0, 319.0, 150.0, 92.0, 65.0, 38.0, 27.0, 20.0, 16.0, 4.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.171875, -15.591552734375, -15.01123046875, -14.430908203125, -13.8505859375, -13.270263671875, -12.68994140625, -12.109619140625, -11.529296875, -10.948974609375, -10.36865234375, -9.788330078125, -9.2080078125, -8.627685546875, -8.04736328125, -7.467041015625, -6.88671875, -6.306396484375, -5.72607421875, -5.145751953125, -4.5654296875, -3.985107421875, -3.40478515625, -2.824462890625, -2.244140625, -1.663818359375, -1.08349609375, -0.503173828125, 0.0771484375, 0.657470703125, 1.23779296875, 1.818115234375, 2.3984375, 2.978759765625, 3.55908203125, 4.139404296875, 4.7197265625, 5.300048828125, 5.88037109375, 6.460693359375, 7.041015625, 7.621337890625, 8.20166015625, 8.781982421875, 9.3623046875, 9.942626953125, 10.52294921875, 11.103271484375, 11.68359375, 12.263916015625, 12.84423828125, 13.424560546875, 14.0048828125, 14.585205078125, 15.16552734375, 15.745849609375, 16.326171875, 16.906494140625, 17.48681640625, 18.067138671875, 18.6474609375, 19.227783203125, 19.80810546875, 20.388427734375, 20.96875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 11.0, 3.0, 11.0, 12.0, 17.0, 27.0, 47.0, 70.0, 75.0, 86.0, 110.0, 162.0, 274.0, 438.0, 1137.0, 580.0, 307.0, 185.0, 129.0, 81.0, 80.0, 58.0, 40.0, 28.0, 19.0, 19.0, 10.0, 13.0, 6.0, 7.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.4921875, -5.32904052734375, -5.1658935546875, -5.00274658203125, -4.839599609375, -4.67645263671875, -4.5133056640625, -4.35015869140625, -4.18701171875, -4.02386474609375, -3.8607177734375, -3.69757080078125, -3.534423828125, -3.37127685546875, -3.2081298828125, -3.04498291015625, -2.8818359375, -2.71868896484375, -2.5555419921875, -2.39239501953125, -2.229248046875, -2.06610107421875, -1.9029541015625, -1.73980712890625, -1.57666015625, -1.41351318359375, -1.2503662109375, -1.08721923828125, -0.924072265625, -0.76092529296875, -0.5977783203125, -0.43463134765625, -0.271484375, -0.10833740234375, 0.0548095703125, 0.21795654296875, 0.381103515625, 0.54425048828125, 0.7073974609375, 0.87054443359375, 1.03369140625, 1.19683837890625, 1.3599853515625, 1.52313232421875, 1.686279296875, 1.84942626953125, 2.0125732421875, 2.17572021484375, 2.3388671875, 2.50201416015625, 2.6651611328125, 2.82830810546875, 2.991455078125, 3.15460205078125, 3.3177490234375, 3.48089599609375, 3.64404296875, 3.80718994140625, 3.9703369140625, 4.13348388671875, 4.296630859375, 4.45977783203125, 4.6229248046875, 4.78607177734375, 4.94921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 9.0, 21.0, 30.0, 48.0, 100.0, 111.0, 145.0, 165.0, 158.0, 84.0, 59.0, 34.0, 21.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-92.56082153320312, -90.71758270263672, -88.87434387207031, -87.03111267089844, -85.18787384033203, -83.34463500976562, -81.50139617919922, -79.65815734863281, -77.8149185180664, -75.9716796875, -74.1284408569336, -72.28520202636719, -70.44197082519531, -68.5987319946289, -66.7554931640625, -64.9122543334961, -63.06901931762695, -61.22578048706055, -59.382545471191406, -57.539306640625, -55.696067810058594, -53.85282897949219, -52.00959396362305, -50.16635513305664, -48.3231201171875, -46.479881286621094, -44.63664627075195, -42.79340744018555, -40.95016860961914, -39.10693359375, -37.263694763183594, -35.42045593261719, -33.57721710205078, -31.733980178833008, -29.8907413482666, -28.047504425048828, -26.204265594482422, -24.36102867126465, -22.517791748046875, -20.67455291748047, -18.831315994262695, -16.988079071044922, -15.144840240478516, -13.301603317260742, -11.458365440368652, -9.615127563476562, -7.771890640258789, -5.928652763366699, -4.085414886474609, -2.2421772480010986, -0.3989396095275879, 1.4442977905273438, 3.2875356674194336, 5.130773544311523, 6.974010467529297, 8.817248344421387, 10.660486221313477, 12.503724098205566, 14.346961975097656, 16.19019889831543, 18.033435821533203, 19.87667465209961, 21.719911575317383, 23.563148498535156, 25.406387329101562]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 5.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 13.0, 17.0, 14.0, 16.0, 11.0, 23.0, 28.0, 29.0, 28.0, 35.0, 35.0, 29.0, 37.0, 54.0, 38.0, 43.0, 43.0, 46.0, 38.0, 36.0, 32.0, 40.0, 40.0, 48.0, 32.0, 26.0, 39.0, 20.0, 12.0, 16.0, 11.0, 8.0, 4.0, 11.0, 8.0, 5.0, 7.0, 4.0, 0.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.20660400390625, -21.53872299194336, -20.870840072631836, -20.202959060668945, -19.535078048706055, -18.86719512939453, -18.19931411743164, -17.53143310546875, -16.863550186157227, -16.195669174194336, -15.527787208557129, -14.859905242919922, -14.192023277282715, -13.524141311645508, -12.856260299682617, -12.18837833404541, -11.52049732208252, -10.852615356445312, -10.184734344482422, -9.516852378845215, -8.848970413208008, -8.181089401245117, -7.51320743560791, -6.845325469970703, -6.177443981170654, -5.5095624923706055, -4.841680526733398, -4.17379903793335, -3.5059173107147217, -2.8380355834960938, -2.170154094696045, -1.502272129058838, -0.8343906402587891, -0.1665089726448059, 0.5013726949691772, 1.1692543029785156, 1.8371360301971436, 2.5050177574157715, 3.1728992462158203, 3.8407812118530273, 4.508662700653076, 5.176544189453125, 5.844426155090332, 6.512307643890381, 7.18018913269043, 7.848071098327637, 8.515953063964844, 9.183834075927734, 9.851716041564941, 10.519598007202148, 11.187479019165039, 11.855360984802246, 12.523242950439453, 13.191123962402344, 13.85900592803955, 14.526887893676758, 15.194768905639648, 15.862650871276855, 16.530532836914062, 17.198413848876953, 17.866294860839844, 18.534177780151367, 19.202058792114258, 19.86994171142578, 20.537822723388672]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 12.0, 19.0, 26.0, 33.0, 52.0, 109.0, 151.0, 276.0, 467.0, 844.0, 1494.0, 2945.0, 5712.0, 12337.0, 27901.0, 63312.0, 138802.0, 252186.0, 261544.0, 152215.0, 70477.0, 30570.0, 13598.0, 6409.0, 3223.0, 1620.0, 880.0, 507.0, 317.0, 171.0, 132.0, 73.0, 40.0, 25.0, 18.0, 23.0, 3.0, 6.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-16.40625, -15.9752197265625, -15.544189453125, -15.1131591796875, -14.68212890625, -14.2510986328125, -13.820068359375, -13.3890380859375, -12.9580078125, -12.5269775390625, -12.095947265625, -11.6649169921875, -11.23388671875, -10.8028564453125, -10.371826171875, -9.9407958984375, -9.509765625, -9.0787353515625, -8.647705078125, -8.2166748046875, -7.78564453125, -7.3546142578125, -6.923583984375, -6.4925537109375, -6.0615234375, -5.6304931640625, -5.199462890625, -4.7684326171875, -4.33740234375, -3.9063720703125, -3.475341796875, -3.0443115234375, -2.61328125, -2.1822509765625, -1.751220703125, -1.3201904296875, -0.88916015625, -0.4581298828125, -0.027099609375, 0.4039306640625, 0.8349609375, 1.2659912109375, 1.697021484375, 2.1280517578125, 2.55908203125, 2.9901123046875, 3.421142578125, 3.8521728515625, 4.283203125, 4.7142333984375, 5.145263671875, 5.5762939453125, 6.00732421875, 6.4383544921875, 6.869384765625, 7.3004150390625, 7.7314453125, 8.1624755859375, 8.593505859375, 9.0245361328125, 9.45556640625, 9.8865966796875, 10.317626953125, 10.7486572265625, 11.1796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 6.0, 7.0, 7.0, 16.0, 13.0, 20.0, 33.0, 25.0, 24.0, 31.0, 35.0, 46.0, 39.0, 48.0, 59.0, 48.0, 47.0, 53.0, 51.0, 38.0, 46.0, 45.0, 37.0, 35.0, 30.0, 26.0, 20.0, 15.0, 17.0, 18.0, 21.0, 8.0, 8.0, 2.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.62109375, -2.52734375, -2.43359375, -2.33984375, -2.24609375, -2.15234375, -2.05859375, -1.96484375, -1.87109375, -1.77734375, -1.68359375, -1.58984375, -1.49609375, -1.40234375, -1.30859375, -1.21484375, -1.12109375, -1.02734375, -0.93359375, -0.83984375, -0.74609375, -0.65234375, -0.55859375, -0.46484375, -0.37109375, -0.27734375, -0.18359375, -0.08984375, 0.00390625, 0.09765625, 0.19140625, 0.28515625, 0.37890625, 0.47265625, 0.56640625, 0.66015625, 0.75390625, 0.84765625, 0.94140625, 1.03515625, 1.12890625, 1.22265625, 1.31640625, 1.41015625, 1.50390625, 1.59765625, 1.69140625, 1.78515625, 1.87890625, 1.97265625, 2.06640625, 2.16015625, 2.25390625, 2.34765625, 2.44140625, 2.53515625, 2.62890625, 2.72265625, 2.81640625, 2.91015625, 3.00390625, 3.09765625, 3.19140625, 3.28515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 11.0, 7.0, 17.0, 11.0, 16.0, 36.0, 40.0, 60.0, 76.0, 118.0, 131.0, 181.0, 247.0, 351.0, 517.0, 817.0, 1472.0, 3274.0, 8241.0, 24338.0, 79119.0, 240144.0, 387550.0, 202691.0, 65343.0, 20237.0, 6950.0, 2751.0, 1350.0, 754.0, 484.0, 328.0, 227.0, 165.0, 134.0, 103.0, 62.0, 52.0, 40.0, 26.0, 17.0, 19.0, 12.0, 10.0, 5.0, 11.0, 2.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.03125, -16.505859375, -15.98046875, -15.455078125, -14.9296875, -14.404296875, -13.87890625, -13.353515625, -12.828125, -12.302734375, -11.77734375, -11.251953125, -10.7265625, -10.201171875, -9.67578125, -9.150390625, -8.625, -8.099609375, -7.57421875, -7.048828125, -6.5234375, -5.998046875, -5.47265625, -4.947265625, -4.421875, -3.896484375, -3.37109375, -2.845703125, -2.3203125, -1.794921875, -1.26953125, -0.744140625, -0.21875, 0.306640625, 0.83203125, 1.357421875, 1.8828125, 2.408203125, 2.93359375, 3.458984375, 3.984375, 4.509765625, 5.03515625, 5.560546875, 6.0859375, 6.611328125, 7.13671875, 7.662109375, 8.1875, 8.712890625, 9.23828125, 9.763671875, 10.2890625, 10.814453125, 11.33984375, 11.865234375, 12.390625, 12.916015625, 13.44140625, 13.966796875, 14.4921875, 15.017578125, 15.54296875, 16.068359375, 16.59375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 9.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 9.0, 21.0, 11.0, 18.0, 13.0, 26.0, 23.0, 19.0, 27.0, 24.0, 30.0, 46.0, 39.0, 32.0, 43.0, 36.0, 32.0, 44.0, 38.0, 33.0, 54.0, 39.0, 36.0, 39.0, 26.0, 32.0, 26.0, 33.0, 24.0, 14.0, 15.0, 13.0, 14.0, 13.0, 9.0, 9.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.6328125, -13.2420654296875, -12.851318359375, -12.4605712890625, -12.06982421875, -11.6790771484375, -11.288330078125, -10.8975830078125, -10.5068359375, -10.1160888671875, -9.725341796875, -9.3345947265625, -8.94384765625, -8.5531005859375, -8.162353515625, -7.7716064453125, -7.380859375, -6.9901123046875, -6.599365234375, -6.2086181640625, -5.81787109375, -5.4271240234375, -5.036376953125, -4.6456298828125, -4.2548828125, -3.8641357421875, -3.473388671875, -3.0826416015625, -2.69189453125, -2.3011474609375, -1.910400390625, -1.5196533203125, -1.12890625, -0.7381591796875, -0.347412109375, 0.0433349609375, 0.43408203125, 0.8248291015625, 1.215576171875, 1.6063232421875, 1.9970703125, 2.3878173828125, 2.778564453125, 3.1693115234375, 3.56005859375, 3.9508056640625, 4.341552734375, 4.7322998046875, 5.123046875, 5.5137939453125, 5.904541015625, 6.2952880859375, 6.68603515625, 7.0767822265625, 7.467529296875, 7.8582763671875, 8.2490234375, 8.6397705078125, 9.030517578125, 9.4212646484375, 9.81201171875, 10.2027587890625, 10.593505859375, 10.9842529296875, 11.375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 5.0, 3.0, 8.0, 16.0, 11.0, 11.0, 34.0, 47.0, 63.0, 84.0, 147.0, 229.0, 408.0, 704.0, 1397.0, 2943.0, 6942.0, 19973.0, 75340.0, 313443.0, 443586.0, 132638.0, 32367.0, 10162.0, 4029.0, 1762.0, 929.0, 494.0, 279.0, 169.0, 95.0, 66.0, 59.0, 37.0, 23.0, 18.0, 8.0, 10.0, 6.0, 2.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5, -10.173828125, -9.84765625, -9.521484375, -9.1953125, -8.869140625, -8.54296875, -8.216796875, -7.890625, -7.564453125, -7.23828125, -6.912109375, -6.5859375, -6.259765625, -5.93359375, -5.607421875, -5.28125, -4.955078125, -4.62890625, -4.302734375, -3.9765625, -3.650390625, -3.32421875, -2.998046875, -2.671875, -2.345703125, -2.01953125, -1.693359375, -1.3671875, -1.041015625, -0.71484375, -0.388671875, -0.0625, 0.263671875, 0.58984375, 0.916015625, 1.2421875, 1.568359375, 1.89453125, 2.220703125, 2.546875, 2.873046875, 3.19921875, 3.525390625, 3.8515625, 4.177734375, 4.50390625, 4.830078125, 5.15625, 5.482421875, 5.80859375, 6.134765625, 6.4609375, 6.787109375, 7.11328125, 7.439453125, 7.765625, 8.091796875, 8.41796875, 8.744140625, 9.0703125, 9.396484375, 9.72265625, 10.048828125, 10.375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 2.0, 11.0, 13.0, 14.0, 26.0, 32.0, 64.0, 90.0, 101.0, 145.0, 161.0, 106.0, 83.0, 47.0, 39.0, 24.0, 7.0, 7.0, 8.0, 6.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002864837646484375, -0.002793237566947937, -0.002721637487411499, -0.002650037407875061, -0.002578437328338623, -0.002506837248802185, -0.002435237169265747, -0.002363637089729309, -0.002292037010192871, -0.002220436930656433, -0.002148836851119995, -0.002077236771583557, -0.002005636692047119, -0.0019340366125106812, -0.0018624365329742432, -0.0017908364534378052, -0.0017192363739013672, -0.0016476362943649292, -0.0015760362148284912, -0.0015044361352920532, -0.0014328360557556152, -0.0013612359762191772, -0.0012896358966827393, -0.0012180358171463013, -0.0011464357376098633, -0.0010748356580734253, -0.0010032355785369873, -0.0009316354990005493, -0.0008600354194641113, -0.0007884353399276733, -0.0007168352603912354, -0.0006452351808547974, -0.0005736351013183594, -0.0005020350217819214, -0.0004304349422454834, -0.0003588348627090454, -0.0002872347831726074, -0.00021563470363616943, -0.00014403462409973145, -7.243454456329346e-05, -8.344650268554688e-07, 7.076561450958252e-05, 0.0001423656940460205, 0.0002139657735824585, 0.0002855658531188965, 0.00035716593265533447, 0.00042876601219177246, 0.0005003660917282104, 0.0005719661712646484, 0.0006435662508010864, 0.0007151663303375244, 0.0007867664098739624, 0.0008583664894104004, 0.0009299665689468384, 0.0010015666484832764, 0.0010731667280197144, 0.0011447668075561523, 0.0012163668870925903, 0.0012879669666290283, 0.0013595670461654663, 0.0014311671257019043, 0.0015027672052383423, 0.0015743672847747803, 0.0016459673643112183, 0.0017175674438476562]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 14.0, 12.0, 9.0, 20.0, 31.0, 50.0, 58.0, 100.0, 160.0, 266.0, 464.0, 880.0, 2031.0, 4737.0, 14952.0, 68718.0, 385709.0, 454937.0, 87472.0, 18147.0, 5442.0, 2087.0, 1001.0, 487.0, 246.0, 176.0, 90.0, 73.0, 45.0, 40.0, 23.0, 21.0, 11.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.59375, -12.1749267578125, -11.756103515625, -11.3372802734375, -10.91845703125, -10.4996337890625, -10.080810546875, -9.6619873046875, -9.2431640625, -8.8243408203125, -8.405517578125, -7.9866943359375, -7.56787109375, -7.1490478515625, -6.730224609375, -6.3114013671875, -5.892578125, -5.4737548828125, -5.054931640625, -4.6361083984375, -4.21728515625, -3.7984619140625, -3.379638671875, -2.9608154296875, -2.5419921875, -2.1231689453125, -1.704345703125, -1.2855224609375, -0.86669921875, -0.4478759765625, -0.029052734375, 0.3897705078125, 0.80859375, 1.2274169921875, 1.646240234375, 2.0650634765625, 2.48388671875, 2.9027099609375, 3.321533203125, 3.7403564453125, 4.1591796875, 4.5780029296875, 4.996826171875, 5.4156494140625, 5.83447265625, 6.2532958984375, 6.672119140625, 7.0909423828125, 7.509765625, 7.9285888671875, 8.347412109375, 8.7662353515625, 9.18505859375, 9.6038818359375, 10.022705078125, 10.4415283203125, 10.8603515625, 11.2791748046875, 11.697998046875, 12.1168212890625, 12.53564453125, 12.9544677734375, 13.373291015625, 13.7921142578125, 14.2109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 9.0, 2.0, 5.0, 5.0, 10.0, 7.0, 14.0, 13.0, 17.0, 15.0, 24.0, 29.0, 31.0, 34.0, 44.0, 49.0, 56.0, 84.0, 67.0, 66.0, 71.0, 64.0, 49.0, 33.0, 34.0, 30.0, 25.0, 22.0, 17.0, 12.0, 8.0, 12.0, 9.0, 7.0, 5.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-7.01953125, -6.838134765625, -6.65673828125, -6.475341796875, -6.2939453125, -6.112548828125, -5.93115234375, -5.749755859375, -5.568359375, -5.386962890625, -5.20556640625, -5.024169921875, -4.8427734375, -4.661376953125, -4.47998046875, -4.298583984375, -4.1171875, -3.935791015625, -3.75439453125, -3.572998046875, -3.3916015625, -3.210205078125, -3.02880859375, -2.847412109375, -2.666015625, -2.484619140625, -2.30322265625, -2.121826171875, -1.9404296875, -1.759033203125, -1.57763671875, -1.396240234375, -1.21484375, -1.033447265625, -0.85205078125, -0.670654296875, -0.4892578125, -0.307861328125, -0.12646484375, 0.054931640625, 0.236328125, 0.417724609375, 0.59912109375, 0.780517578125, 0.9619140625, 1.143310546875, 1.32470703125, 1.506103515625, 1.6875, 1.868896484375, 2.05029296875, 2.231689453125, 2.4130859375, 2.594482421875, 2.77587890625, 2.957275390625, 3.138671875, 3.320068359375, 3.50146484375, 3.682861328125, 3.8642578125, 4.045654296875, 4.22705078125, 4.408447265625, 4.58984375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 23.0, 28.0, 74.0, 109.0, 181.0, 190.0, 167.0, 121.0, 67.0, 17.0, 8.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-231.29701232910156, -225.31338500976562, -219.32974243164062, -213.34609985351562, -207.3624725341797, -201.37884521484375, -195.39520263671875, -189.41156005859375, -183.4279327392578, -177.44430541992188, -171.46066284179688, -165.47702026367188, -159.49339294433594, -153.509765625, -147.526123046875, -141.54248046875, -135.55885314941406, -129.57522583007812, -123.59158325195312, -117.60794830322266, -111.62431335449219, -105.64067840576172, -99.65704345703125, -93.67340850830078, -87.68977355957031, -81.70613861083984, -75.72250366210938, -69.7388687133789, -63.75523376464844, -57.77159881591797, -51.7879638671875, -45.80432891845703, -39.8206787109375, -33.83704376220703, -27.853408813476562, -21.869773864746094, -15.886138916015625, -9.902503967285156, -3.9188690185546875, 2.0647659301757812, 8.04840087890625, 14.032035827636719, 20.015670776367188, 25.999305725097656, 31.982940673828125, 37.966575622558594, 43.95021057128906, 49.93384552001953, 55.91748046875, 61.90111541748047, 67.88475036621094, 73.8683853149414, 79.85202026367188, 85.83565521240234, 91.81929016113281, 97.80292510986328, 103.78656005859375, 109.77019500732422, 115.75382995605469, 121.73746490478516, 127.72109985351562, 133.70474243164062, 139.68836975097656, 145.6719970703125, 151.6556396484375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 8.0, 8.0, 8.0, 11.0, 20.0, 23.0, 23.0, 32.0, 28.0, 36.0, 51.0, 52.0, 49.0, 41.0, 54.0, 46.0, 54.0, 56.0, 52.0, 47.0, 43.0, 31.0, 37.0, 30.0, 29.0, 24.0, 23.0, 20.0, 12.0, 12.0, 13.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.86239624023438, -75.18463897705078, -72.50687408447266, -69.82911682128906, -67.15135955810547, -64.47359466552734, -61.79583740234375, -59.11807632446289, -56.44031524658203, -53.76255416870117, -51.08479690551758, -48.40703582763672, -45.72927474975586, -43.051513671875, -40.373756408691406, -37.69599533081055, -35.01823806762695, -32.340476989746094, -29.662717819213867, -26.98495864868164, -24.30719757080078, -21.629438400268555, -18.951679229736328, -16.27391815185547, -13.596158981323242, -10.9183988571167, -8.240638732910156, -5.56287956237793, -2.8851194381713867, -0.20735931396484375, 2.470399856567383, 5.148160934448242, 7.825920104980469, 10.503680229187012, 13.181440353393555, 15.859199523925781, 18.53696060180664, 21.214719772338867, 23.892478942871094, 26.570240020751953, 29.24799919128418, 31.925758361816406, 34.603519439697266, 37.281280517578125, 39.95903778076172, 42.63679885864258, 45.31455993652344, 47.99231719970703, 50.67007827758789, 53.34783935546875, 56.025596618652344, 58.7033576965332, 61.38111877441406, 64.05887603759766, 66.73663330078125, 69.41439819335938, 72.09215545654297, 74.76991271972656, 77.44767761230469, 80.12543487548828, 82.80319213867188, 85.48095703125, 88.1587142944336, 90.83647155761719, 93.51423645019531]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 11.0, 11.0, 14.0, 24.0, 42.0, 58.0, 86.0, 118.0, 232.0, 326.0, 559.0, 988.0, 1790.0, 3384.0, 6574.0, 13549.0, 31488.0, 83918.0, 296046.0, 2758383.0, 750726.0, 152539.0, 51578.0, 20496.0, 9777.0, 4941.0, 2696.0, 1533.0, 854.0, 528.0, 352.0, 211.0, 147.0, 79.0, 63.0, 48.0, 34.0, 23.0, 14.0, 12.0, 8.0, 9.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.0625, -16.55712890625, -16.0517578125, -15.54638671875, -15.041015625, -14.53564453125, -14.0302734375, -13.52490234375, -13.01953125, -12.51416015625, -12.0087890625, -11.50341796875, -10.998046875, -10.49267578125, -9.9873046875, -9.48193359375, -8.9765625, -8.47119140625, -7.9658203125, -7.46044921875, -6.955078125, -6.44970703125, -5.9443359375, -5.43896484375, -4.93359375, -4.42822265625, -3.9228515625, -3.41748046875, -2.912109375, -2.40673828125, -1.9013671875, -1.39599609375, -0.890625, -0.38525390625, 0.1201171875, 0.62548828125, 1.130859375, 1.63623046875, 2.1416015625, 2.64697265625, 3.15234375, 3.65771484375, 4.1630859375, 4.66845703125, 5.173828125, 5.67919921875, 6.1845703125, 6.68994140625, 7.1953125, 7.70068359375, 8.2060546875, 8.71142578125, 9.216796875, 9.72216796875, 10.2275390625, 10.73291015625, 11.23828125, 11.74365234375, 12.2490234375, 12.75439453125, 13.259765625, 13.76513671875, 14.2705078125, 14.77587890625, 15.28125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 2.0, 6.0, 5.0, 6.0, 15.0, 21.0, 18.0, 17.0, 31.0, 27.0, 43.0, 36.0, 43.0, 52.0, 34.0, 47.0, 82.0, 53.0, 65.0, 52.0, 57.0, 37.0, 34.0, 29.0, 30.0, 22.0, 20.0, 32.0, 16.0, 15.0, 15.0, 6.0, 10.0, 12.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.882720947265625, -2.78497314453125, -2.687225341796875, -2.5894775390625, -2.491729736328125, -2.39398193359375, -2.296234130859375, -2.198486328125, -2.100738525390625, -2.00299072265625, -1.905242919921875, -1.8074951171875, -1.709747314453125, -1.61199951171875, -1.514251708984375, -1.41650390625, -1.318756103515625, -1.22100830078125, -1.123260498046875, -1.0255126953125, -0.927764892578125, -0.83001708984375, -0.732269287109375, -0.634521484375, -0.536773681640625, -0.43902587890625, -0.341278076171875, -0.2435302734375, -0.145782470703125, -0.04803466796875, 0.049713134765625, 0.1474609375, 0.245208740234375, 0.34295654296875, 0.440704345703125, 0.5384521484375, 0.636199951171875, 0.73394775390625, 0.831695556640625, 0.929443359375, 1.027191162109375, 1.12493896484375, 1.222686767578125, 1.3204345703125, 1.418182373046875, 1.51593017578125, 1.613677978515625, 1.71142578125, 1.809173583984375, 1.90692138671875, 2.004669189453125, 2.1024169921875, 2.200164794921875, 2.29791259765625, 2.395660400390625, 2.493408203125, 2.591156005859375, 2.68890380859375, 2.786651611328125, 2.8843994140625, 2.982147216796875, 3.07989501953125, 3.177642822265625, 3.275390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 16.0, 21.0, 30.0, 39.0, 66.0, 73.0, 94.0, 197.0, 338.0, 1029.0, 5150.0, 60832.0, 3448651.0, 652444.0, 21278.0, 2523.0, 644.0, 303.0, 152.0, 103.0, 85.0, 51.0, 40.0, 33.0, 29.0, 11.0, 14.0, 5.0, 7.0, 3.0, 4.0, 4.0, 5.0], "bins": [-68.375, -66.814208984375, -65.25341796875, -63.692626953125, -62.1318359375, -60.571044921875, -59.01025390625, -57.449462890625, -55.888671875, -54.327880859375, -52.76708984375, -51.206298828125, -49.6455078125, -48.084716796875, -46.52392578125, -44.963134765625, -43.40234375, -41.841552734375, -40.28076171875, -38.719970703125, -37.1591796875, -35.598388671875, -34.03759765625, -32.476806640625, -30.916015625, -29.355224609375, -27.79443359375, -26.233642578125, -24.6728515625, -23.112060546875, -21.55126953125, -19.990478515625, -18.4296875, -16.868896484375, -15.30810546875, -13.747314453125, -12.1865234375, -10.625732421875, -9.06494140625, -7.504150390625, -5.943359375, -4.382568359375, -2.82177734375, -1.260986328125, 0.2998046875, 1.860595703125, 3.42138671875, 4.982177734375, 6.54296875, 8.103759765625, 9.66455078125, 11.225341796875, 12.7861328125, 14.346923828125, 15.90771484375, 17.468505859375, 19.029296875, 20.590087890625, 22.15087890625, 23.711669921875, 25.2724609375, 26.833251953125, 28.39404296875, 29.954833984375, 31.515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 8.0, 17.0, 24.0, 47.0, 91.0, 164.0, 318.0, 748.0, 1413.0, 532.0, 313.0, 172.0, 85.0, 49.0, 33.0, 21.0, 10.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.13671875, -5.73760986328125, -5.3385009765625, -4.93939208984375, -4.540283203125, -4.14117431640625, -3.7420654296875, -3.34295654296875, -2.94384765625, -2.54473876953125, -2.1456298828125, -1.74652099609375, -1.347412109375, -0.94830322265625, -0.5491943359375, -0.15008544921875, 0.2490234375, 0.64813232421875, 1.0472412109375, 1.44635009765625, 1.845458984375, 2.24456787109375, 2.6436767578125, 3.04278564453125, 3.44189453125, 3.84100341796875, 4.2401123046875, 4.63922119140625, 5.038330078125, 5.43743896484375, 5.8365478515625, 6.23565673828125, 6.634765625, 7.03387451171875, 7.4329833984375, 7.83209228515625, 8.231201171875, 8.63031005859375, 9.0294189453125, 9.42852783203125, 9.82763671875, 10.22674560546875, 10.6258544921875, 11.02496337890625, 11.424072265625, 11.82318115234375, 12.2222900390625, 12.62139892578125, 13.0205078125, 13.41961669921875, 13.8187255859375, 14.21783447265625, 14.616943359375, 15.01605224609375, 15.4151611328125, 15.81427001953125, 16.21337890625, 16.61248779296875, 17.0115966796875, 17.41070556640625, 17.809814453125, 18.20892333984375, 18.6080322265625, 19.00714111328125, 19.40625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 15.0, 33.0, 65.0, 98.0, 140.0, 169.0, 154.0, 127.0, 96.0, 37.0, 24.0, 16.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.52430725097656, -116.35123443603516, -113.17815399169922, -110.00508117675781, -106.83200073242188, -103.65892791748047, -100.48585510253906, -97.31277465820312, -94.13970184326172, -90.96662902832031, -87.79354858398438, -84.62047576904297, -81.44740295410156, -78.27432250976562, -75.10124969482422, -71.92817687988281, -68.75509643554688, -65.58202362060547, -62.40894317626953, -59.235870361328125, -56.06279373168945, -52.88971710205078, -49.716644287109375, -46.5435676574707, -43.37049102783203, -40.19741439819336, -37.02433776855469, -33.85126495361328, -30.67818832397461, -27.505111694335938, -24.3320369720459, -21.15896224975586, -17.985885620117188, -14.812809944152832, -11.639734268188477, -8.466658592224121, -5.293582916259766, -2.12050724029541, 1.0525684356689453, 4.225643157958984, 7.398719787597656, 10.571795463562012, 13.744871139526367, 16.917945861816406, 20.091022491455078, 23.26409912109375, 26.43717384338379, 29.610248565673828, 32.7833251953125, 35.95640182495117, 39.129478454589844, 42.30255126953125, 45.47562789916992, 48.648704528808594, 51.82177734375, 54.99485397338867, 58.167930603027344, 61.341007232666016, 64.51408386230469, 67.6871566772461, 70.8602294921875, 74.03330993652344, 77.20638275146484, 80.37945556640625, 83.55253601074219]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 7.0, 13.0, 12.0, 11.0, 17.0, 27.0, 25.0, 37.0, 29.0, 40.0, 42.0, 31.0, 61.0, 54.0, 52.0, 46.0, 51.0, 50.0, 45.0, 41.0, 43.0, 38.0, 26.0, 36.0, 28.0, 20.0, 16.0, 13.0, 14.0, 16.0, 15.0, 10.0, 8.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.718284606933594, -33.530364990234375, -32.342445373535156, -31.15452766418457, -29.966609954833984, -28.778690338134766, -27.590770721435547, -26.402851104736328, -25.214933395385742, -24.027013778686523, -22.839096069335938, -21.65117645263672, -20.4632568359375, -19.275339126586914, -18.087419509887695, -16.89950180053711, -15.71158218383789, -14.523663520812988, -13.335744857788086, -12.147825241088867, -10.959906578063965, -9.771987915039062, -8.584068298339844, -7.396149635314941, -6.208230972290039, -5.020312309265137, -3.832393169403076, -2.6444742679595947, -1.4565553665161133, -0.26863670349121094, 0.9192824363708496, 2.10720157623291, 3.2951202392578125, 4.483038902282715, 5.670958042144775, 6.858877182006836, 8.046795845031738, 9.23471450805664, 10.42263412475586, 11.610552787780762, 12.798471450805664, 13.986390113830566, 15.174308776855469, 16.362228393554688, 17.550148010253906, 18.738065719604492, 19.92598533630371, 21.113903045654297, 22.301822662353516, 23.489742279052734, 24.67765998840332, 25.86557960510254, 27.053497314453125, 28.241416931152344, 29.429336547851562, 30.61725616455078, 31.805173873901367, 32.99309158325195, 34.18101119995117, 35.36893081665039, 36.55685043334961, 37.74476623535156, 38.93268585205078, 40.12060546875, 41.30852508544922]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 15.0, 10.0, 17.0, 20.0, 48.0, 48.0, 91.0, 138.0, 231.0, 373.0, 671.0, 1090.0, 2229.0, 4442.0, 9532.0, 21119.0, 47715.0, 105883.0, 222966.0, 308323.0, 174033.0, 81361.0, 36548.0, 16605.0, 7491.0, 3470.0, 1820.0, 925.0, 531.0, 312.0, 196.0, 102.0, 75.0, 41.0, 24.0, 23.0, 15.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.8203125, -15.345703125, -14.87109375, -14.396484375, -13.921875, -13.447265625, -12.97265625, -12.498046875, -12.0234375, -11.548828125, -11.07421875, -10.599609375, -10.125, -9.650390625, -9.17578125, -8.701171875, -8.2265625, -7.751953125, -7.27734375, -6.802734375, -6.328125, -5.853515625, -5.37890625, -4.904296875, -4.4296875, -3.955078125, -3.48046875, -3.005859375, -2.53125, -2.056640625, -1.58203125, -1.107421875, -0.6328125, -0.158203125, 0.31640625, 0.791015625, 1.265625, 1.740234375, 2.21484375, 2.689453125, 3.1640625, 3.638671875, 4.11328125, 4.587890625, 5.0625, 5.537109375, 6.01171875, 6.486328125, 6.9609375, 7.435546875, 7.91015625, 8.384765625, 8.859375, 9.333984375, 9.80859375, 10.283203125, 10.7578125, 11.232421875, 11.70703125, 12.181640625, 12.65625, 13.130859375, 13.60546875, 14.080078125, 14.5546875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 17.0, 11.0, 23.0, 17.0, 27.0, 33.0, 19.0, 37.0, 30.0, 38.0, 46.0, 47.0, 49.0, 60.0, 61.0, 46.0, 43.0, 43.0, 40.0, 39.0, 33.0, 38.0, 25.0, 27.0, 14.0, 27.0, 18.0, 15.0, 13.0, 15.0, 6.0, 8.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.334197998046875, -2.24456787109375, -2.154937744140625, -2.0653076171875, -1.975677490234375, -1.88604736328125, -1.796417236328125, -1.706787109375, -1.617156982421875, -1.52752685546875, -1.437896728515625, -1.3482666015625, -1.258636474609375, -1.16900634765625, -1.079376220703125, -0.98974609375, -0.900115966796875, -0.81048583984375, -0.720855712890625, -0.6312255859375, -0.541595458984375, -0.45196533203125, -0.362335205078125, -0.272705078125, -0.183074951171875, -0.09344482421875, -0.003814697265625, 0.0858154296875, 0.175445556640625, 0.26507568359375, 0.354705810546875, 0.4443359375, 0.533966064453125, 0.62359619140625, 0.713226318359375, 0.8028564453125, 0.892486572265625, 0.98211669921875, 1.071746826171875, 1.161376953125, 1.251007080078125, 1.34063720703125, 1.430267333984375, 1.5198974609375, 1.609527587890625, 1.69915771484375, 1.788787841796875, 1.87841796875, 1.968048095703125, 2.05767822265625, 2.147308349609375, 2.2369384765625, 2.326568603515625, 2.41619873046875, 2.505828857421875, 2.595458984375, 2.685089111328125, 2.77471923828125, 2.864349365234375, 2.9539794921875, 3.043609619140625, 3.13323974609375, 3.222869873046875, 3.3125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 0.0, 8.0, 9.0, 9.0, 13.0, 20.0, 28.0, 27.0, 36.0, 44.0, 50.0, 79.0, 75.0, 115.0, 164.0, 164.0, 246.0, 366.0, 543.0, 833.0, 1383.0, 2520.0, 4933.0, 9875.0, 21844.0, 49167.0, 107570.0, 225417.0, 298251.0, 173958.0, 81041.0, 36286.0, 16369.0, 7588.0, 3840.0, 1982.0, 1159.0, 739.0, 505.0, 335.0, 253.0, 159.0, 122.0, 105.0, 79.0, 56.0, 50.0, 38.0, 27.0, 21.0, 14.0, 17.0, 8.0, 3.0, 4.0, 9.0, 4.0, 1.0, 4.0, 1.0], "bins": [-11.59375, -11.2349853515625, -10.876220703125, -10.5174560546875, -10.15869140625, -9.7999267578125, -9.441162109375, -9.0823974609375, -8.7236328125, -8.3648681640625, -8.006103515625, -7.6473388671875, -7.28857421875, -6.9298095703125, -6.571044921875, -6.2122802734375, -5.853515625, -5.4947509765625, -5.135986328125, -4.7772216796875, -4.41845703125, -4.0596923828125, -3.700927734375, -3.3421630859375, -2.9833984375, -2.6246337890625, -2.265869140625, -1.9071044921875, -1.54833984375, -1.1895751953125, -0.830810546875, -0.4720458984375, -0.11328125, 0.2454833984375, 0.604248046875, 0.9630126953125, 1.32177734375, 1.6805419921875, 2.039306640625, 2.3980712890625, 2.7568359375, 3.1156005859375, 3.474365234375, 3.8331298828125, 4.19189453125, 4.5506591796875, 4.909423828125, 5.2681884765625, 5.626953125, 5.9857177734375, 6.344482421875, 6.7032470703125, 7.06201171875, 7.4207763671875, 7.779541015625, 8.1383056640625, 8.4970703125, 8.8558349609375, 9.214599609375, 9.5733642578125, 9.93212890625, 10.2908935546875, 10.649658203125, 11.0084228515625, 11.3671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 8.0, 12.0, 7.0, 15.0, 11.0, 14.0, 17.0, 18.0, 19.0, 41.0, 34.0, 40.0, 37.0, 41.0, 57.0, 42.0, 54.0, 44.0, 59.0, 56.0, 44.0, 37.0, 54.0, 44.0, 37.0, 21.0, 32.0, 19.0, 16.0, 14.0, 17.0, 17.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.453125, -12.997802734375, -12.54248046875, -12.087158203125, -11.6318359375, -11.176513671875, -10.72119140625, -10.265869140625, -9.810546875, -9.355224609375, -8.89990234375, -8.444580078125, -7.9892578125, -7.533935546875, -7.07861328125, -6.623291015625, -6.16796875, -5.712646484375, -5.25732421875, -4.802001953125, -4.3466796875, -3.891357421875, -3.43603515625, -2.980712890625, -2.525390625, -2.070068359375, -1.61474609375, -1.159423828125, -0.7041015625, -0.248779296875, 0.20654296875, 0.661865234375, 1.1171875, 1.572509765625, 2.02783203125, 2.483154296875, 2.9384765625, 3.393798828125, 3.84912109375, 4.304443359375, 4.759765625, 5.215087890625, 5.67041015625, 6.125732421875, 6.5810546875, 7.036376953125, 7.49169921875, 7.947021484375, 8.40234375, 8.857666015625, 9.31298828125, 9.768310546875, 10.2236328125, 10.678955078125, 11.13427734375, 11.589599609375, 12.044921875, 12.500244140625, 12.95556640625, 13.410888671875, 13.8662109375, 14.321533203125, 14.77685546875, 15.232177734375, 15.6875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 12.0, 13.0, 20.0, 34.0, 45.0, 67.0, 130.0, 234.0, 353.0, 689.0, 1337.0, 3090.0, 7960.0, 24572.0, 95402.0, 383326.0, 392536.0, 99049.0, 25246.0, 8244.0, 3180.0, 1357.0, 693.0, 379.0, 209.0, 134.0, 81.0, 50.0, 33.0, 18.0, 13.0, 12.0, 7.0, 8.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3046875, -9.9827880859375, -9.660888671875, -9.3389892578125, -9.01708984375, -8.6951904296875, -8.373291015625, -8.0513916015625, -7.7294921875, -7.4075927734375, -7.085693359375, -6.7637939453125, -6.44189453125, -6.1199951171875, -5.798095703125, -5.4761962890625, -5.154296875, -4.8323974609375, -4.510498046875, -4.1885986328125, -3.86669921875, -3.5447998046875, -3.222900390625, -2.9010009765625, -2.5791015625, -2.2572021484375, -1.935302734375, -1.6134033203125, -1.29150390625, -0.9696044921875, -0.647705078125, -0.3258056640625, -0.00390625, 0.3179931640625, 0.639892578125, 0.9617919921875, 1.28369140625, 1.6055908203125, 1.927490234375, 2.2493896484375, 2.5712890625, 2.8931884765625, 3.215087890625, 3.5369873046875, 3.85888671875, 4.1807861328125, 4.502685546875, 4.8245849609375, 5.146484375, 5.4683837890625, 5.790283203125, 6.1121826171875, 6.43408203125, 6.7559814453125, 7.077880859375, 7.3997802734375, 7.7216796875, 8.0435791015625, 8.365478515625, 8.6873779296875, 9.00927734375, 9.3311767578125, 9.653076171875, 9.9749755859375, 10.296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 2.0, 6.0, 2.0, 6.0, 10.0, 16.0, 9.0, 23.0, 24.0, 28.0, 41.0, 28.0, 62.0, 57.0, 95.0, 125.0, 98.0, 73.0, 52.0, 45.0, 40.0, 21.0, 25.0, 21.0, 15.0, 13.0, 12.0, 11.0, 9.0, 3.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0014162063598632812, -0.0013765394687652588, -0.0013368725776672363, -0.0012972056865692139, -0.0012575387954711914, -0.001217871904373169, -0.0011782050132751465, -0.001138538122177124, -0.0010988712310791016, -0.001059204339981079, -0.0010195374488830566, -0.0009798705577850342, -0.0009402036666870117, -0.0009005367755889893, -0.0008608698844909668, -0.0008212029933929443, -0.0007815361022949219, -0.0007418692111968994, -0.000702202320098877, -0.0006625354290008545, -0.000622868537902832, -0.0005832016468048096, -0.0005435347557067871, -0.0005038678646087646, -0.0004642009735107422, -0.0004245340824127197, -0.00038486719131469727, -0.0003452003002166748, -0.00030553340911865234, -0.0002658665180206299, -0.00022619962692260742, -0.00018653273582458496, -0.0001468658447265625, -0.00010719895362854004, -6.753206253051758e-05, -2.7865171432495117e-05, 1.1801719665527344e-05, 5.1468610763549805e-05, 9.113550186157227e-05, 0.00013080239295959473, 0.0001704692840576172, 0.00021013617515563965, 0.0002498030662536621, 0.00028946995735168457, 0.00032913684844970703, 0.0003688037395477295, 0.00040847063064575195, 0.0004481375217437744, 0.0004878044128417969, 0.0005274713039398193, 0.0005671381950378418, 0.0006068050861358643, 0.0006464719772338867, 0.0006861388683319092, 0.0007258057594299316, 0.0007654726505279541, 0.0008051395416259766, 0.000844806432723999, 0.0008844733238220215, 0.0009241402149200439, 0.0009638071060180664, 0.0010034739971160889, 0.0010431408882141113, 0.0010828077793121338, 0.0011224746704101562]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 1.0, 5.0, 5.0, 11.0, 16.0, 19.0, 26.0, 43.0, 93.0, 161.0, 321.0, 596.0, 1213.0, 2848.0, 8064.0, 28335.0, 133456.0, 528648.0, 270948.0, 52673.0, 13345.0, 4230.0, 1784.0, 803.0, 353.0, 215.0, 122.0, 66.0, 51.0, 31.0, 17.0, 19.0, 14.0, 8.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -13.111083984375, -12.72216796875, -12.333251953125, -11.9443359375, -11.555419921875, -11.16650390625, -10.777587890625, -10.388671875, -9.999755859375, -9.61083984375, -9.221923828125, -8.8330078125, -8.444091796875, -8.05517578125, -7.666259765625, -7.27734375, -6.888427734375, -6.49951171875, -6.110595703125, -5.7216796875, -5.332763671875, -4.94384765625, -4.554931640625, -4.166015625, -3.777099609375, -3.38818359375, -2.999267578125, -2.6103515625, -2.221435546875, -1.83251953125, -1.443603515625, -1.0546875, -0.665771484375, -0.27685546875, 0.112060546875, 0.5009765625, 0.889892578125, 1.27880859375, 1.667724609375, 2.056640625, 2.445556640625, 2.83447265625, 3.223388671875, 3.6123046875, 4.001220703125, 4.39013671875, 4.779052734375, 5.16796875, 5.556884765625, 5.94580078125, 6.334716796875, 6.7236328125, 7.112548828125, 7.50146484375, 7.890380859375, 8.279296875, 8.668212890625, 9.05712890625, 9.446044921875, 9.8349609375, 10.223876953125, 10.61279296875, 11.001708984375, 11.390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 9.0, 14.0, 21.0, 19.0, 31.0, 35.0, 40.0, 58.0, 71.0, 88.0, 79.0, 96.0, 79.0, 75.0, 54.0, 52.0, 41.0, 29.0, 29.0, 12.0, 11.0, 4.0, 9.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.26953125, -7.0362548828125, -6.802978515625, -6.5697021484375, -6.33642578125, -6.1031494140625, -5.869873046875, -5.6365966796875, -5.4033203125, -5.1700439453125, -4.936767578125, -4.7034912109375, -4.47021484375, -4.2369384765625, -4.003662109375, -3.7703857421875, -3.537109375, -3.3038330078125, -3.070556640625, -2.8372802734375, -2.60400390625, -2.3707275390625, -2.137451171875, -1.9041748046875, -1.6708984375, -1.4376220703125, -1.204345703125, -0.9710693359375, -0.73779296875, -0.5045166015625, -0.271240234375, -0.0379638671875, 0.1953125, 0.4285888671875, 0.661865234375, 0.8951416015625, 1.12841796875, 1.3616943359375, 1.594970703125, 1.8282470703125, 2.0615234375, 2.2947998046875, 2.528076171875, 2.7613525390625, 2.99462890625, 3.2279052734375, 3.461181640625, 3.6944580078125, 3.927734375, 4.1610107421875, 4.394287109375, 4.6275634765625, 4.86083984375, 5.0941162109375, 5.327392578125, 5.5606689453125, 5.7939453125, 6.0272216796875, 6.260498046875, 6.4937744140625, 6.72705078125, 6.9603271484375, 7.193603515625, 7.4268798828125, 7.66015625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 13.0, 11.0, 16.0, 31.0, 67.0, 104.0, 145.0, 162.0, 170.0, 133.0, 76.0, 36.0, 16.0, 11.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.40904235839844, -167.1335906982422, -161.85813903808594, -156.5826873779297, -151.3072509765625, -146.03179931640625, -140.75634765625, -135.48089599609375, -130.2054443359375, -124.92999267578125, -119.654541015625, -114.37909698486328, -109.10364532470703, -103.82819366455078, -98.55274963378906, -93.27729797363281, -88.00184631347656, -82.72639465332031, -77.45094299316406, -72.17549896240234, -66.9000473022461, -61.624595642089844, -56.34914779663086, -51.073699951171875, -45.798248291015625, -40.522796630859375, -35.24734878540039, -29.971899032592773, -24.696449279785156, -19.42099952697754, -14.145549774169922, -8.870101928710938, -3.59466552734375, 1.6807842254638672, 6.956233978271484, 12.231683731079102, 17.50713348388672, 22.782583236694336, 28.058032989501953, 33.33348083496094, 38.60893249511719, 43.88438415527344, 49.15983200073242, 54.435279846191406, 59.710731506347656, 64.9861831665039, 70.26162719726562, 75.53707885742188, 80.81253051757812, 86.08798217773438, 91.36343383789062, 96.63887786865234, 101.9143295288086, 107.18978118896484, 112.46522521972656, 117.74067687988281, 123.01612854003906, 128.2915802001953, 133.56703186035156, 138.8424835205078, 144.117919921875, 149.39337158203125, 154.6688232421875, 159.94427490234375, 165.2197265625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 10.0, 10.0, 7.0, 12.0, 8.0, 9.0, 19.0, 12.0, 18.0, 19.0, 19.0, 20.0, 26.0, 37.0, 39.0, 42.0, 29.0, 30.0, 35.0, 29.0, 38.0, 42.0, 40.0, 45.0, 38.0, 41.0, 36.0, 27.0, 28.0, 32.0, 21.0, 22.0, 20.0, 28.0, 21.0, 9.0, 17.0, 13.0, 9.0, 12.0, 6.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.08466339111328, -63.961360931396484, -61.83805847167969, -59.714759826660156, -57.59145736694336, -55.46815490722656, -53.34485626220703, -51.221553802490234, -49.09825134277344, -46.97494888305664, -44.851646423339844, -42.72834777832031, -40.605045318603516, -38.48174285888672, -36.35844421386719, -34.23514175415039, -32.111839294433594, -29.988536834716797, -27.865236282348633, -25.74193572998047, -23.618633270263672, -21.495330810546875, -19.37203025817871, -17.248729705810547, -15.12542724609375, -13.00212574005127, -10.878824234008789, -8.755522727966309, -6.632221221923828, -4.508919715881348, -2.385618209838867, -0.2623167037963867, 1.8609771728515625, 3.984278678894043, 6.107580184936523, 8.230881690979004, 10.354183197021484, 12.477484703063965, 14.600786209106445, 16.72408676147461, 18.847389221191406, 20.970691680908203, 23.093992233276367, 25.21729278564453, 27.340595245361328, 29.463897705078125, 31.58719825744629, 33.71049880981445, 35.83380126953125, 37.95710372924805, 40.080406188964844, 42.203704833984375, 44.32700729370117, 46.45030975341797, 48.5736083984375, 50.6969108581543, 52.820213317871094, 54.94351577758789, 57.06681823730469, 59.19011688232422, 61.313419342041016, 63.43672180175781, 65.56002044677734, 67.6833267211914, 69.80662536621094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 2.0, 5.0, 7.0, 12.0, 14.0, 10.0, 28.0, 27.0, 39.0, 58.0, 96.0, 141.0, 206.0, 298.0, 451.0, 772.0, 1292.0, 2377.0, 4293.0, 8631.0, 17320.0, 41603.0, 128170.0, 1082907.0, 2659429.0, 157327.0, 47718.0, 20063.0, 9325.0, 4873.0, 2670.0, 1498.0, 933.0, 571.0, 360.0, 243.0, 163.0, 114.0, 75.0, 44.0, 37.0, 25.0, 18.0, 12.0, 12.0, 2.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-16.46875, -15.9708251953125, -15.472900390625, -14.9749755859375, -14.47705078125, -13.9791259765625, -13.481201171875, -12.9832763671875, -12.4853515625, -11.9874267578125, -11.489501953125, -10.9915771484375, -10.49365234375, -9.9957275390625, -9.497802734375, -8.9998779296875, -8.501953125, -8.0040283203125, -7.506103515625, -7.0081787109375, -6.51025390625, -6.0123291015625, -5.514404296875, -5.0164794921875, -4.5185546875, -4.0206298828125, -3.522705078125, -3.0247802734375, -2.52685546875, -2.0289306640625, -1.531005859375, -1.0330810546875, -0.53515625, -0.0372314453125, 0.460693359375, 0.9586181640625, 1.45654296875, 1.9544677734375, 2.452392578125, 2.9503173828125, 3.4482421875, 3.9461669921875, 4.444091796875, 4.9420166015625, 5.43994140625, 5.9378662109375, 6.435791015625, 6.9337158203125, 7.431640625, 7.9295654296875, 8.427490234375, 8.9254150390625, 9.42333984375, 9.9212646484375, 10.419189453125, 10.9171142578125, 11.4150390625, 11.9129638671875, 12.410888671875, 12.9088134765625, 13.40673828125, 13.9046630859375, 14.402587890625, 14.9005126953125, 15.3984375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 2.0, 6.0, 4.0, 11.0, 10.0, 15.0, 17.0, 20.0, 17.0, 23.0, 25.0, 24.0, 41.0, 27.0, 52.0, 32.0, 61.0, 41.0, 33.0, 51.0, 51.0, 44.0, 39.0, 29.0, 39.0, 40.0, 34.0, 33.0, 16.0, 28.0, 16.0, 27.0, 11.0, 14.0, 13.0, 11.0, 9.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.3699951171875, -2.284912109375, -2.1998291015625, -2.11474609375, -2.0296630859375, -1.944580078125, -1.8594970703125, -1.7744140625, -1.6893310546875, -1.604248046875, -1.5191650390625, -1.43408203125, -1.3489990234375, -1.263916015625, -1.1788330078125, -1.09375, -1.0086669921875, -0.923583984375, -0.8385009765625, -0.75341796875, -0.6683349609375, -0.583251953125, -0.4981689453125, -0.4130859375, -0.3280029296875, -0.242919921875, -0.1578369140625, -0.07275390625, 0.0123291015625, 0.097412109375, 0.1824951171875, 0.267578125, 0.3526611328125, 0.437744140625, 0.5228271484375, 0.60791015625, 0.6929931640625, 0.778076171875, 0.8631591796875, 0.9482421875, 1.0333251953125, 1.118408203125, 1.2034912109375, 1.28857421875, 1.3736572265625, 1.458740234375, 1.5438232421875, 1.62890625, 1.7139892578125, 1.799072265625, 1.8841552734375, 1.96923828125, 2.0543212890625, 2.139404296875, 2.2244873046875, 2.3095703125, 2.3946533203125, 2.479736328125, 2.5648193359375, 2.64990234375, 2.7349853515625, 2.820068359375, 2.9051513671875, 2.990234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 13.0, 30.0, 16.0, 28.0, 28.0, 34.0, 57.0, 67.0, 72.0, 82.0, 132.0, 272.0, 899.0, 3622.0, 22771.0, 278620.0, 3700009.0, 167118.0, 16214.0, 2712.0, 657.0, 237.0, 120.0, 82.0, 71.0, 56.0, 39.0, 35.0, 35.0, 22.0, 36.0, 14.0, 19.0, 10.0, 7.0, 9.0, 3.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -34.1279296875, -33.005859375, -31.8837890625, -30.76171875, -29.6396484375, -28.517578125, -27.3955078125, -26.2734375, -25.1513671875, -24.029296875, -22.9072265625, -21.78515625, -20.6630859375, -19.541015625, -18.4189453125, -17.296875, -16.1748046875, -15.052734375, -13.9306640625, -12.80859375, -11.6865234375, -10.564453125, -9.4423828125, -8.3203125, -7.1982421875, -6.076171875, -4.9541015625, -3.83203125, -2.7099609375, -1.587890625, -0.4658203125, 0.65625, 1.7783203125, 2.900390625, 4.0224609375, 5.14453125, 6.2666015625, 7.388671875, 8.5107421875, 9.6328125, 10.7548828125, 11.876953125, 12.9990234375, 14.12109375, 15.2431640625, 16.365234375, 17.4873046875, 18.609375, 19.7314453125, 20.853515625, 21.9755859375, 23.09765625, 24.2197265625, 25.341796875, 26.4638671875, 27.5859375, 28.7080078125, 29.830078125, 30.9521484375, 32.07421875, 33.1962890625, 34.318359375, 35.4404296875, 36.5625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 17.0, 12.0, 31.0, 82.0, 144.0, 420.0, 1957.0, 923.0, 263.0, 112.0, 53.0, 31.0, 17.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.984375, -16.522705078125, -16.06103515625, -15.599365234375, -15.1376953125, -14.676025390625, -14.21435546875, -13.752685546875, -13.291015625, -12.829345703125, -12.36767578125, -11.906005859375, -11.4443359375, -10.982666015625, -10.52099609375, -10.059326171875, -9.59765625, -9.135986328125, -8.67431640625, -8.212646484375, -7.7509765625, -7.289306640625, -6.82763671875, -6.365966796875, -5.904296875, -5.442626953125, -4.98095703125, -4.519287109375, -4.0576171875, -3.595947265625, -3.13427734375, -2.672607421875, -2.2109375, -1.749267578125, -1.28759765625, -0.825927734375, -0.3642578125, 0.097412109375, 0.55908203125, 1.020751953125, 1.482421875, 1.944091796875, 2.40576171875, 2.867431640625, 3.3291015625, 3.790771484375, 4.25244140625, 4.714111328125, 5.17578125, 5.637451171875, 6.09912109375, 6.560791015625, 7.0224609375, 7.484130859375, 7.94580078125, 8.407470703125, 8.869140625, 9.330810546875, 9.79248046875, 10.254150390625, 10.7158203125, 11.177490234375, 11.63916015625, 12.100830078125, 12.5625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 13.0, 13.0, 12.0, 26.0, 52.0, 59.0, 98.0, 140.0, 147.0, 122.0, 117.0, 73.0, 49.0, 29.0, 23.0, 12.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-74.19105529785156, -72.3633041381836, -70.53555297851562, -68.70780181884766, -66.88005065917969, -65.05229187011719, -63.22454071044922, -61.39678955078125, -59.56903839111328, -57.74128723144531, -55.913536071777344, -54.08578109741211, -52.25802993774414, -50.43027877807617, -48.60252380371094, -46.77477264404297, -44.947021484375, -43.11927032470703, -41.29151916503906, -39.46376419067383, -37.63601303100586, -35.80826187133789, -33.980506896972656, -32.15275573730469, -30.32500457763672, -28.49725341796875, -26.66950035095215, -24.841747283935547, -23.013996124267578, -21.18624496459961, -19.358491897583008, -17.530738830566406, -15.702987670898438, -13.875235557556152, -12.047483444213867, -10.219731330871582, -8.391979217529297, -6.564227104187012, -4.736474990844727, -2.9087228775024414, -1.0809707641601562, 0.7467813491821289, 2.574533462524414, 4.402285575866699, 6.230037689208984, 8.05778980255127, 9.885541915893555, 11.71329402923584, 13.541046142578125, 15.36879825592041, 17.196550369262695, 19.024303436279297, 20.852054595947266, 22.679805755615234, 24.507558822631836, 26.335311889648438, 28.163063049316406, 29.990814208984375, 31.818567276000977, 33.64632034301758, 35.47407150268555, 37.301822662353516, 39.12957763671875, 40.95732879638672, 42.78507995605469]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 5.0, 14.0, 14.0, 12.0, 19.0, 14.0, 22.0, 25.0, 21.0, 33.0, 34.0, 32.0, 30.0, 29.0, 41.0, 30.0, 30.0, 35.0, 38.0, 41.0, 27.0, 52.0, 37.0, 36.0, 37.0, 22.0, 24.0, 25.0, 19.0, 25.0, 10.0, 19.0, 13.0, 12.0, 16.0, 11.0, 14.0, 8.0, 9.0, 10.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-20.922992706298828, -20.303266525268555, -19.683542251586914, -19.06381607055664, -18.444091796875, -17.824365615844727, -17.204641342163086, -16.584915161132812, -15.965190887451172, -15.345465660095215, -14.725740432739258, -14.1060152053833, -13.486289978027344, -12.866564750671387, -12.24683952331543, -11.627113342285156, -11.0073881149292, -10.387662887573242, -9.767937660217285, -9.148212432861328, -8.528487205505371, -7.908761978149414, -7.289036273956299, -6.669311046600342, -6.049585819244385, -5.429860591888428, -4.810135364532471, -4.1904096603393555, -3.5706846714019775, -2.9509594440460205, -2.3312339782714844, -1.7115087509155273, -1.0917835235595703, -0.4720582365989685, 0.1476670503616333, 0.7673923969268799, 1.387117624282837, 2.006842851638794, 2.62656831741333, 3.246293544769287, 3.866018772125244, 4.485743999481201, 5.105469226837158, 5.725194931030273, 6.3449201583862305, 6.9646453857421875, 7.5843706130981445, 8.204095840454102, 8.823821067810059, 9.443546295166016, 10.063271522521973, 10.68299674987793, 11.302721977233887, 11.922447204589844, 12.542173385620117, 13.161897659301758, 13.781623840332031, 14.401349067687988, 15.021074295043945, 15.640799522399902, 16.26052474975586, 16.880250930786133, 17.499975204467773, 18.119701385498047, 18.739425659179688]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 7.0, 7.0, 11.0, 14.0, 10.0, 17.0, 29.0, 49.0, 52.0, 74.0, 124.0, 182.0, 286.0, 433.0, 613.0, 1004.0, 1570.0, 2702.0, 4802.0, 8567.0, 15385.0, 29035.0, 55184.0, 105526.0, 194999.0, 263603.0, 169983.0, 90984.0, 47380.0, 24866.0, 13229.0, 7357.0, 4101.0, 2465.0, 1400.0, 837.0, 534.0, 332.0, 266.0, 156.0, 109.0, 66.0, 56.0, 37.0, 28.0, 28.0, 12.0, 10.0, 14.0, 8.0, 2.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-11.390625, -10.9892578125, -10.587890625, -10.1865234375, -9.78515625, -9.3837890625, -8.982421875, -8.5810546875, -8.1796875, -7.7783203125, -7.376953125, -6.9755859375, -6.57421875, -6.1728515625, -5.771484375, -5.3701171875, -4.96875, -4.5673828125, -4.166015625, -3.7646484375, -3.36328125, -2.9619140625, -2.560546875, -2.1591796875, -1.7578125, -1.3564453125, -0.955078125, -0.5537109375, -0.15234375, 0.2490234375, 0.650390625, 1.0517578125, 1.453125, 1.8544921875, 2.255859375, 2.6572265625, 3.05859375, 3.4599609375, 3.861328125, 4.2626953125, 4.6640625, 5.0654296875, 5.466796875, 5.8681640625, 6.26953125, 6.6708984375, 7.072265625, 7.4736328125, 7.875, 8.2763671875, 8.677734375, 9.0791015625, 9.48046875, 9.8818359375, 10.283203125, 10.6845703125, 11.0859375, 11.4873046875, 11.888671875, 12.2900390625, 12.69140625, 13.0927734375, 13.494140625, 13.8955078125, 14.296875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 4.0, 2.0, 5.0, 11.0, 8.0, 13.0, 18.0, 21.0, 18.0, 16.0, 19.0, 21.0, 35.0, 27.0, 38.0, 51.0, 45.0, 41.0, 47.0, 63.0, 39.0, 39.0, 48.0, 39.0, 41.0, 33.0, 37.0, 30.0, 23.0, 21.0, 23.0, 14.0, 19.0, 13.0, 19.0, 14.0, 13.0, 8.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.245452880859375, -2.16082763671875, -2.076202392578125, -1.9915771484375, -1.906951904296875, -1.82232666015625, -1.737701416015625, -1.653076171875, -1.568450927734375, -1.48382568359375, -1.399200439453125, -1.3145751953125, -1.229949951171875, -1.14532470703125, -1.060699462890625, -0.97607421875, -0.891448974609375, -0.80682373046875, -0.722198486328125, -0.6375732421875, -0.552947998046875, -0.46832275390625, -0.383697509765625, -0.299072265625, -0.214447021484375, -0.12982177734375, -0.045196533203125, 0.0394287109375, 0.124053955078125, 0.20867919921875, 0.293304443359375, 0.3779296875, 0.462554931640625, 0.54718017578125, 0.631805419921875, 0.7164306640625, 0.801055908203125, 0.88568115234375, 0.970306396484375, 1.054931640625, 1.139556884765625, 1.22418212890625, 1.308807373046875, 1.3934326171875, 1.478057861328125, 1.56268310546875, 1.647308349609375, 1.73193359375, 1.816558837890625, 1.90118408203125, 1.985809326171875, 2.0704345703125, 2.155059814453125, 2.23968505859375, 2.324310302734375, 2.408935546875, 2.493560791015625, 2.57818603515625, 2.662811279296875, 2.7474365234375, 2.832061767578125, 2.91668701171875, 3.001312255859375, 3.0859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 2.0, 8.0, 6.0, 10.0, 12.0, 18.0, 31.0, 31.0, 42.0, 53.0, 67.0, 92.0, 120.0, 159.0, 239.0, 308.0, 405.0, 650.0, 1153.0, 2378.0, 6360.0, 19346.0, 67781.0, 228191.0, 438523.0, 196951.0, 58092.0, 16723.0, 5441.0, 2190.0, 1083.0, 617.0, 374.0, 272.0, 206.0, 161.0, 99.0, 80.0, 60.0, 50.0, 34.0, 32.0, 28.0, 18.0, 21.0, 14.0, 4.0, 5.0, 7.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-17.65625, -17.128173828125, -16.60009765625, -16.072021484375, -15.5439453125, -15.015869140625, -14.48779296875, -13.959716796875, -13.431640625, -12.903564453125, -12.37548828125, -11.847412109375, -11.3193359375, -10.791259765625, -10.26318359375, -9.735107421875, -9.20703125, -8.678955078125, -8.15087890625, -7.622802734375, -7.0947265625, -6.566650390625, -6.03857421875, -5.510498046875, -4.982421875, -4.454345703125, -3.92626953125, -3.398193359375, -2.8701171875, -2.342041015625, -1.81396484375, -1.285888671875, -0.7578125, -0.229736328125, 0.29833984375, 0.826416015625, 1.3544921875, 1.882568359375, 2.41064453125, 2.938720703125, 3.466796875, 3.994873046875, 4.52294921875, 5.051025390625, 5.5791015625, 6.107177734375, 6.63525390625, 7.163330078125, 7.69140625, 8.219482421875, 8.74755859375, 9.275634765625, 9.8037109375, 10.331787109375, 10.85986328125, 11.387939453125, 11.916015625, 12.444091796875, 12.97216796875, 13.500244140625, 14.0283203125, 14.556396484375, 15.08447265625, 15.612548828125, 16.140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 4.0, 13.0, 8.0, 8.0, 13.0, 15.0, 23.0, 13.0, 21.0, 28.0, 27.0, 31.0, 34.0, 38.0, 50.0, 35.0, 41.0, 49.0, 42.0, 53.0, 29.0, 37.0, 35.0, 38.0, 29.0, 31.0, 29.0, 32.0, 32.0, 22.0, 17.0, 21.0, 14.0, 11.0, 16.0, 10.0, 13.0, 10.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.46875, -11.112060546875, -10.75537109375, -10.398681640625, -10.0419921875, -9.685302734375, -9.32861328125, -8.971923828125, -8.615234375, -8.258544921875, -7.90185546875, -7.545166015625, -7.1884765625, -6.831787109375, -6.47509765625, -6.118408203125, -5.76171875, -5.405029296875, -5.04833984375, -4.691650390625, -4.3349609375, -3.978271484375, -3.62158203125, -3.264892578125, -2.908203125, -2.551513671875, -2.19482421875, -1.838134765625, -1.4814453125, -1.124755859375, -0.76806640625, -0.411376953125, -0.0546875, 0.302001953125, 0.65869140625, 1.015380859375, 1.3720703125, 1.728759765625, 2.08544921875, 2.442138671875, 2.798828125, 3.155517578125, 3.51220703125, 3.868896484375, 4.2255859375, 4.582275390625, 4.93896484375, 5.295654296875, 5.65234375, 6.009033203125, 6.36572265625, 6.722412109375, 7.0791015625, 7.435791015625, 7.79248046875, 8.149169921875, 8.505859375, 8.862548828125, 9.21923828125, 9.575927734375, 9.9326171875, 10.289306640625, 10.64599609375, 11.002685546875, 11.359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 11.0, 21.0, 24.0, 40.0, 77.0, 173.0, 394.0, 923.0, 2867.0, 10872.0, 63201.0, 521826.0, 389739.0, 45804.0, 8828.0, 2285.0, 809.0, 288.0, 125.0, 78.0, 42.0, 32.0, 19.0, 12.0, 4.0, 10.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.0682373046875, -13.581787109375, -13.0953369140625, -12.60888671875, -12.1224365234375, -11.635986328125, -11.1495361328125, -10.6630859375, -10.1766357421875, -9.690185546875, -9.2037353515625, -8.71728515625, -8.2308349609375, -7.744384765625, -7.2579345703125, -6.771484375, -6.2850341796875, -5.798583984375, -5.3121337890625, -4.82568359375, -4.3392333984375, -3.852783203125, -3.3663330078125, -2.8798828125, -2.3934326171875, -1.906982421875, -1.4205322265625, -0.93408203125, -0.4476318359375, 0.038818359375, 0.5252685546875, 1.01171875, 1.4981689453125, 1.984619140625, 2.4710693359375, 2.95751953125, 3.4439697265625, 3.930419921875, 4.4168701171875, 4.9033203125, 5.3897705078125, 5.876220703125, 6.3626708984375, 6.84912109375, 7.3355712890625, 7.822021484375, 8.3084716796875, 8.794921875, 9.2813720703125, 9.767822265625, 10.2542724609375, 10.74072265625, 11.2271728515625, 11.713623046875, 12.2000732421875, 12.6865234375, 13.1729736328125, 13.659423828125, 14.1458740234375, 14.63232421875, 15.1187744140625, 15.605224609375, 16.0916748046875, 16.578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 8.0, 16.0, 15.0, 21.0, 25.0, 34.0, 39.0, 39.0, 59.0, 83.0, 131.0, 147.0, 91.0, 51.0, 47.0, 36.0, 24.0, 25.0, 15.0, 18.0, 16.0, 12.0, 9.0, 8.0, 4.0, 9.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014314651489257812, -0.001386880874633789, -0.0013422966003417969, -0.0012977123260498047, -0.0012531280517578125, -0.0012085437774658203, -0.0011639595031738281, -0.001119375228881836, -0.0010747909545898438, -0.0010302066802978516, -0.0009856224060058594, -0.0009410381317138672, -0.000896453857421875, -0.0008518695831298828, -0.0008072853088378906, -0.0007627010345458984, -0.0007181167602539062, -0.0006735324859619141, -0.0006289482116699219, -0.0005843639373779297, -0.0005397796630859375, -0.0004951953887939453, -0.0004506111145019531, -0.00040602684020996094, -0.00036144256591796875, -0.00031685829162597656, -0.0002722740173339844, -0.0002276897430419922, -0.00018310546875, -0.0001385211944580078, -9.393692016601562e-05, -4.935264587402344e-05, -4.76837158203125e-06, 3.981590270996094e-05, 8.440017700195312e-05, 0.0001289844512939453, 0.0001735687255859375, 0.0002181529998779297, 0.0002627372741699219, 0.00030732154846191406, 0.00035190582275390625, 0.00039649009704589844, 0.0004410743713378906, 0.0004856586456298828, 0.000530242919921875, 0.0005748271942138672, 0.0006194114685058594, 0.0006639957427978516, 0.0007085800170898438, 0.0007531642913818359, 0.0007977485656738281, 0.0008423328399658203, 0.0008869171142578125, 0.0009315013885498047, 0.0009760856628417969, 0.001020669937133789, 0.0010652542114257812, 0.0011098384857177734, 0.0011544227600097656, 0.0011990070343017578, 0.00124359130859375, 0.0012881755828857422, 0.0013327598571777344, 0.0013773441314697266, 0.0014219284057617188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 3.0, 5.0, 3.0, 8.0, 10.0, 7.0, 10.0, 21.0, 19.0, 31.0, 46.0, 93.0, 126.0, 224.0, 427.0, 829.0, 1781.0, 4803.0, 19727.0, 168037.0, 721096.0, 109259.0, 14749.0, 4035.0, 1613.0, 692.0, 377.0, 188.0, 122.0, 74.0, 34.0, 32.0, 15.0, 18.0, 14.0, 8.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.46875, -17.916015625, -17.36328125, -16.810546875, -16.2578125, -15.705078125, -15.15234375, -14.599609375, -14.046875, -13.494140625, -12.94140625, -12.388671875, -11.8359375, -11.283203125, -10.73046875, -10.177734375, -9.625, -9.072265625, -8.51953125, -7.966796875, -7.4140625, -6.861328125, -6.30859375, -5.755859375, -5.203125, -4.650390625, -4.09765625, -3.544921875, -2.9921875, -2.439453125, -1.88671875, -1.333984375, -0.78125, -0.228515625, 0.32421875, 0.876953125, 1.4296875, 1.982421875, 2.53515625, 3.087890625, 3.640625, 4.193359375, 4.74609375, 5.298828125, 5.8515625, 6.404296875, 6.95703125, 7.509765625, 8.0625, 8.615234375, 9.16796875, 9.720703125, 10.2734375, 10.826171875, 11.37890625, 11.931640625, 12.484375, 13.037109375, 13.58984375, 14.142578125, 14.6953125, 15.248046875, 15.80078125, 16.353515625, 16.90625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 6.0, 3.0, 14.0, 15.0, 21.0, 33.0, 47.0, 54.0, 83.0, 118.0, 107.0, 112.0, 98.0, 63.0, 51.0, 55.0, 27.0, 22.0, 13.0, 7.0, 10.0, 4.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.3284912109375, -7.047607421875, -6.7667236328125, -6.48583984375, -6.2049560546875, -5.924072265625, -5.6431884765625, -5.3623046875, -5.0814208984375, -4.800537109375, -4.5196533203125, -4.23876953125, -3.9578857421875, -3.677001953125, -3.3961181640625, -3.115234375, -2.8343505859375, -2.553466796875, -2.2725830078125, -1.99169921875, -1.7108154296875, -1.429931640625, -1.1490478515625, -0.8681640625, -0.5872802734375, -0.306396484375, -0.0255126953125, 0.25537109375, 0.5362548828125, 0.817138671875, 1.0980224609375, 1.37890625, 1.6597900390625, 1.940673828125, 2.2215576171875, 2.50244140625, 2.7833251953125, 3.064208984375, 3.3450927734375, 3.6259765625, 3.9068603515625, 4.187744140625, 4.4686279296875, 4.74951171875, 5.0303955078125, 5.311279296875, 5.5921630859375, 5.873046875, 6.1539306640625, 6.434814453125, 6.7156982421875, 6.99658203125, 7.2774658203125, 7.558349609375, 7.8392333984375, 8.1201171875, 8.4010009765625, 8.681884765625, 8.9627685546875, 9.24365234375, 9.5245361328125, 9.805419921875, 10.0863037109375, 10.3671875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 9.0, 26.0, 39.0, 81.0, 156.0, 210.0, 191.0, 134.0, 82.0, 39.0, 18.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-172.3468017578125, -166.20130920410156, -160.0558319091797, -153.91033935546875, -147.76486206054688, -141.61936950683594, -135.473876953125, -129.32839965820312, -123.18290710449219, -117.03742218017578, -110.89193725585938, -104.74644470214844, -98.60095977783203, -92.45547485351562, -86.30998229980469, -80.16449737548828, -74.01901245117188, -67.87352752685547, -61.7280387878418, -55.582550048828125, -49.43706512451172, -43.29158020019531, -37.14609146118164, -31.00060272216797, -24.855117797851562, -18.709630966186523, -12.564144134521484, -6.418657302856445, -0.27317047119140625, 5.872316360473633, 12.017803192138672, 18.163291931152344, 24.30877685546875, 30.45426368713379, 36.59975051879883, 42.7452392578125, 48.890724182128906, 55.03620910644531, 61.181697845458984, 67.32718658447266, 73.47267150878906, 79.61815643310547, 85.76364135742188, 91.90913391113281, 98.05461883544922, 104.20010375976562, 110.34559631347656, 116.49108123779297, 122.63656616210938, 128.7820587158203, 134.9275360107422, 141.07302856445312, 147.218505859375, 153.36399841308594, 159.50949096679688, 165.65496826171875, 171.8004608154297, 177.94595336914062, 184.0914306640625, 190.23692321777344, 196.38241577148438, 202.52789306640625, 208.6733856201172, 214.81887817382812, 220.96435546875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 6.0, 9.0, 10.0, 19.0, 16.0, 11.0, 18.0, 23.0, 21.0, 31.0, 24.0, 25.0, 27.0, 31.0, 39.0, 41.0, 52.0, 48.0, 52.0, 42.0, 42.0, 41.0, 33.0, 43.0, 36.0, 34.0, 32.0, 35.0, 21.0, 22.0, 17.0, 14.0, 12.0, 7.0, 13.0, 11.0, 11.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-72.09889221191406, -70.00700378417969, -67.91511535644531, -65.82323455810547, -63.731346130371094, -61.63945770263672, -59.547569274902344, -57.45568084716797, -55.36379623413086, -53.271907806396484, -51.180023193359375, -49.088134765625, -46.996246337890625, -44.904361724853516, -42.81247329711914, -40.72058868408203, -38.628700256347656, -36.53681182861328, -34.44492721557617, -32.3530387878418, -30.261152267456055, -28.169265747070312, -26.077377319335938, -23.985490798950195, -21.893604278564453, -19.80171775817871, -17.70983123779297, -15.617942810058594, -13.526056289672852, -11.43416976928711, -9.34228229522705, -7.250394821166992, -5.158515930175781, -3.066628932952881, -0.9747419357299805, 1.11714506149292, 3.2090320587158203, 5.3009185791015625, 7.392806053161621, 9.48469352722168, 11.576580047607422, 13.668466567993164, 15.760354042053223, 17.85224151611328, 19.944128036499023, 22.036014556884766, 24.12790298461914, 26.219789505004883, 28.311676025390625, 30.403562545776367, 32.49544906616211, 34.587337493896484, 36.679222106933594, 38.77111053466797, 40.862998962402344, 42.95488739013672, 45.04677200317383, 47.1386604309082, 49.23054504394531, 51.32243347167969, 53.41432189941406, 55.50620651245117, 57.59809494018555, 59.689979553222656, 61.78186798095703]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 12.0, 7.0, 7.0, 18.0, 25.0, 37.0, 52.0, 73.0, 128.0, 167.0, 288.0, 392.0, 636.0, 1073.0, 1724.0, 3093.0, 5907.0, 12133.0, 27312.0, 71997.0, 278254.0, 3078994.0, 537049.0, 105146.0, 36667.0, 15789.0, 7550.0, 3998.0, 2264.0, 1317.0, 812.0, 479.0, 303.0, 207.0, 125.0, 70.0, 53.0, 43.0, 26.0, 22.0, 13.0, 8.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.296875, -15.7822265625, -15.267578125, -14.7529296875, -14.23828125, -13.7236328125, -13.208984375, -12.6943359375, -12.1796875, -11.6650390625, -11.150390625, -10.6357421875, -10.12109375, -9.6064453125, -9.091796875, -8.5771484375, -8.0625, -7.5478515625, -7.033203125, -6.5185546875, -6.00390625, -5.4892578125, -4.974609375, -4.4599609375, -3.9453125, -3.4306640625, -2.916015625, -2.4013671875, -1.88671875, -1.3720703125, -0.857421875, -0.3427734375, 0.171875, 0.6865234375, 1.201171875, 1.7158203125, 2.23046875, 2.7451171875, 3.259765625, 3.7744140625, 4.2890625, 4.8037109375, 5.318359375, 5.8330078125, 6.34765625, 6.8623046875, 7.376953125, 7.8916015625, 8.40625, 8.9208984375, 9.435546875, 9.9501953125, 10.46484375, 10.9794921875, 11.494140625, 12.0087890625, 12.5234375, 13.0380859375, 13.552734375, 14.0673828125, 14.58203125, 15.0966796875, 15.611328125, 16.1259765625, 16.640625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 2.0, 1.0, 4.0, 8.0, 12.0, 13.0, 21.0, 20.0, 18.0, 21.0, 30.0, 25.0, 22.0, 48.0, 29.0, 56.0, 44.0, 50.0, 46.0, 47.0, 52.0, 40.0, 33.0, 43.0, 37.0, 40.0, 38.0, 33.0, 29.0, 27.0, 18.0, 12.0, 15.0, 13.0, 23.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.5657958984375, -2.473388671875, -2.3809814453125, -2.28857421875, -2.1961669921875, -2.103759765625, -2.0113525390625, -1.9189453125, -1.8265380859375, -1.734130859375, -1.6417236328125, -1.54931640625, -1.4569091796875, -1.364501953125, -1.2720947265625, -1.1796875, -1.0872802734375, -0.994873046875, -0.9024658203125, -0.81005859375, -0.7176513671875, -0.625244140625, -0.5328369140625, -0.4404296875, -0.3480224609375, -0.255615234375, -0.1632080078125, -0.07080078125, 0.0216064453125, 0.114013671875, 0.2064208984375, 0.298828125, 0.3912353515625, 0.483642578125, 0.5760498046875, 0.66845703125, 0.7608642578125, 0.853271484375, 0.9456787109375, 1.0380859375, 1.1304931640625, 1.222900390625, 1.3153076171875, 1.40771484375, 1.5001220703125, 1.592529296875, 1.6849365234375, 1.77734375, 1.8697509765625, 1.962158203125, 2.0545654296875, 2.14697265625, 2.2393798828125, 2.331787109375, 2.4241943359375, 2.5166015625, 2.6090087890625, 2.701416015625, 2.7938232421875, 2.88623046875, 2.9786376953125, 3.071044921875, 3.1634521484375, 3.255859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 14.0, 18.0, 21.0, 28.0, 50.0, 59.0, 108.0, 192.0, 441.0, 1197.0, 3423.0, 13214.0, 68803.0, 738083.0, 3156358.0, 176343.0, 26605.0, 6129.0, 1821.0, 679.0, 281.0, 141.0, 61.0, 48.0, 28.0, 19.0, 22.0, 14.0, 14.0, 14.0, 5.0, 7.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.0625, -23.2919921875, -22.521484375, -21.7509765625, -20.98046875, -20.2099609375, -19.439453125, -18.6689453125, -17.8984375, -17.1279296875, -16.357421875, -15.5869140625, -14.81640625, -14.0458984375, -13.275390625, -12.5048828125, -11.734375, -10.9638671875, -10.193359375, -9.4228515625, -8.65234375, -7.8818359375, -7.111328125, -6.3408203125, -5.5703125, -4.7998046875, -4.029296875, -3.2587890625, -2.48828125, -1.7177734375, -0.947265625, -0.1767578125, 0.59375, 1.3642578125, 2.134765625, 2.9052734375, 3.67578125, 4.4462890625, 5.216796875, 5.9873046875, 6.7578125, 7.5283203125, 8.298828125, 9.0693359375, 9.83984375, 10.6103515625, 11.380859375, 12.1513671875, 12.921875, 13.6923828125, 14.462890625, 15.2333984375, 16.00390625, 16.7744140625, 17.544921875, 18.3154296875, 19.0859375, 19.8564453125, 20.626953125, 21.3974609375, 22.16796875, 22.9384765625, 23.708984375, 24.4794921875, 25.25]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 8.0, 2.0, 8.0, 15.0, 15.0, 35.0, 31.0, 55.0, 70.0, 113.0, 190.0, 360.0, 759.0, 1230.0, 469.0, 245.0, 163.0, 91.0, 70.0, 51.0, 25.0, 21.0, 14.0, 12.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.765625, -10.50457763671875, -10.2435302734375, -9.98248291015625, -9.721435546875, -9.46038818359375, -9.1993408203125, -8.93829345703125, -8.67724609375, -8.41619873046875, -8.1551513671875, -7.89410400390625, -7.633056640625, -7.37200927734375, -7.1109619140625, -6.84991455078125, -6.5888671875, -6.32781982421875, -6.0667724609375, -5.80572509765625, -5.544677734375, -5.28363037109375, -5.0225830078125, -4.76153564453125, -4.50048828125, -4.23944091796875, -3.9783935546875, -3.71734619140625, -3.456298828125, -3.19525146484375, -2.9342041015625, -2.67315673828125, -2.412109375, -2.15106201171875, -1.8900146484375, -1.62896728515625, -1.367919921875, -1.10687255859375, -0.8458251953125, -0.58477783203125, -0.32373046875, -0.06268310546875, 0.1983642578125, 0.45941162109375, 0.720458984375, 0.98150634765625, 1.2425537109375, 1.50360107421875, 1.7646484375, 2.02569580078125, 2.2867431640625, 2.54779052734375, 2.808837890625, 3.06988525390625, 3.3309326171875, 3.59197998046875, 3.85302734375, 4.11407470703125, 4.3751220703125, 4.63616943359375, 4.897216796875, 5.15826416015625, 5.4193115234375, 5.68035888671875, 5.94140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 16.0, 48.0, 91.0, 169.0, 247.0, 217.0, 105.0, 54.0, 26.0, 10.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-160.65032958984375, -157.3536834716797, -154.05703735351562, -150.76040649414062, -147.46376037597656, -144.1671142578125, -140.87046813964844, -137.57382202148438, -134.2771759033203, -130.98052978515625, -127.68389129638672, -124.38724517822266, -121.0905990600586, -117.79396057128906, -114.497314453125, -111.20066833496094, -107.90403747558594, -104.60739135742188, -101.31075286865234, -98.01410675048828, -94.71746063232422, -91.42082214355469, -88.12417602539062, -84.82752990722656, -81.5308837890625, -78.23423767089844, -74.9375991821289, -71.64095306396484, -68.34430694580078, -65.04766845703125, -61.75102233886719, -58.45438003540039, -55.15774154663086, -51.86109924316406, -48.564453125, -45.2678108215332, -41.971168518066406, -38.674522399902344, -35.37788009643555, -32.08123779296875, -28.78459358215332, -25.48794937133789, -22.191307067871094, -18.894662857055664, -15.59801959991455, -12.301376342773438, -9.004732131958008, -5.708089828491211, -2.4114456176757812, 0.8851978778839111, 4.1818413734436035, 7.478485107421875, 10.775128364562988, 14.071771621704102, 17.36841583251953, 20.665058135986328, 23.961702346801758, 27.258346557617188, 30.554988861083984, 33.85163116455078, 37.148277282714844, 40.44491958618164, 43.74156188964844, 47.0382080078125, 50.3348503112793]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 7.0, 8.0, 7.0, 7.0, 17.0, 13.0, 11.0, 16.0, 19.0, 23.0, 20.0, 30.0, 31.0, 23.0, 37.0, 39.0, 32.0, 42.0, 41.0, 38.0, 50.0, 36.0, 40.0, 29.0, 38.0, 47.0, 52.0, 34.0, 23.0, 21.0, 27.0, 16.0, 24.0, 15.0, 9.0, 17.0, 8.0, 6.0, 7.0, 6.0, 7.0, 5.0, 2.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.069576263427734, -20.323698043823242, -19.57781982421875, -18.83194351196289, -18.0860652923584, -17.340187072753906, -16.594308853149414, -15.848430633544922, -15.102553367614746, -14.356675148010254, -13.610797882080078, -12.864919662475586, -12.119041442871094, -11.373164176940918, -10.627285957336426, -9.88140869140625, -9.135530471801758, -8.389652252197266, -7.64377498626709, -6.897896766662598, -6.152019023895264, -5.40614128112793, -4.6602630615234375, -3.9143853187561035, -3.1685075759887695, -2.4226298332214355, -1.6767518520355225, -0.9308738708496094, -0.1849961280822754, 0.5608816146850586, 1.3067598342895508, 2.0526375770568848, 2.7985172271728516, 3.5443949699401855, 4.2902727127075195, 5.036150932312012, 5.782028675079346, 6.52790641784668, 7.273784637451172, 8.019662857055664, 8.76554012298584, 9.511418342590332, 10.257295608520508, 11.003173828125, 11.749052047729492, 12.494929313659668, 13.24080753326416, 13.986684799194336, 14.732563018798828, 15.47844123840332, 16.224319458007812, 16.970195770263672, 17.716073989868164, 18.461952209472656, 19.20783042907715, 19.95370864868164, 20.6995849609375, 21.445463180541992, 22.191341400146484, 22.937217712402344, 23.683095932006836, 24.428974151611328, 25.17485237121582, 25.920730590820312, 26.666608810424805]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 4.0, 12.0, 17.0, 29.0, 41.0, 76.0, 113.0, 173.0, 272.0, 464.0, 801.0, 1452.0, 2705.0, 5657.0, 11664.0, 25563.0, 59120.0, 163087.0, 469149.0, 188661.0, 65878.0, 27966.0, 12857.0, 6054.0, 3002.0, 1552.0, 861.0, 495.0, 293.0, 197.0, 126.0, 77.0, 55.0, 30.0, 17.0, 14.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.953125, -19.421875, -18.890625, -18.359375, -17.828125, -17.296875, -16.765625, -16.234375, -15.703125, -15.171875, -14.640625, -14.109375, -13.578125, -13.046875, -12.515625, -11.984375, -11.453125, -10.921875, -10.390625, -9.859375, -9.328125, -8.796875, -8.265625, -7.734375, -7.203125, -6.671875, -6.140625, -5.609375, -5.078125, -4.546875, -4.015625, -3.484375, -2.953125, -2.421875, -1.890625, -1.359375, -0.828125, -0.296875, 0.234375, 0.765625, 1.296875, 1.828125, 2.359375, 2.890625, 3.421875, 3.953125, 4.484375, 5.015625, 5.546875, 6.078125, 6.609375, 7.140625, 7.671875, 8.203125, 8.734375, 9.265625, 9.796875, 10.328125, 10.859375, 11.390625, 11.921875, 12.453125, 12.984375, 13.515625, 14.046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 9.0, 7.0, 17.0, 10.0, 9.0, 20.0, 29.0, 16.0, 28.0, 27.0, 37.0, 28.0, 24.0, 41.0, 55.0, 40.0, 62.0, 41.0, 50.0, 39.0, 41.0, 34.0, 42.0, 46.0, 32.0, 42.0, 32.0, 24.0, 20.0, 28.0, 10.0, 16.0, 14.0, 10.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.30645751953125, -2.2144775390625, -2.12249755859375, -2.030517578125, -1.93853759765625, -1.8465576171875, -1.75457763671875, -1.66259765625, -1.57061767578125, -1.4786376953125, -1.38665771484375, -1.294677734375, -1.20269775390625, -1.1107177734375, -1.01873779296875, -0.9267578125, -0.83477783203125, -0.7427978515625, -0.65081787109375, -0.558837890625, -0.46685791015625, -0.3748779296875, -0.28289794921875, -0.19091796875, -0.09893798828125, -0.0069580078125, 0.08502197265625, 0.177001953125, 0.26898193359375, 0.3609619140625, 0.45294189453125, 0.544921875, 0.63690185546875, 0.7288818359375, 0.82086181640625, 0.912841796875, 1.00482177734375, 1.0968017578125, 1.18878173828125, 1.28076171875, 1.37274169921875, 1.4647216796875, 1.55670166015625, 1.648681640625, 1.74066162109375, 1.8326416015625, 1.92462158203125, 2.0166015625, 2.10858154296875, 2.2005615234375, 2.29254150390625, 2.384521484375, 2.47650146484375, 2.5684814453125, 2.66046142578125, 2.75244140625, 2.84442138671875, 2.9364013671875, 3.02838134765625, 3.120361328125, 3.21234130859375, 3.3043212890625, 3.39630126953125, 3.48828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 16.0, 17.0, 17.0, 22.0, 26.0, 49.0, 59.0, 73.0, 105.0, 125.0, 171.0, 249.0, 335.0, 494.0, 901.0, 1883.0, 5178.0, 15915.0, 53877.0, 194358.0, 545818.0, 161293.0, 45258.0, 13606.0, 4430.0, 1750.0, 863.0, 445.0, 321.0, 237.0, 166.0, 126.0, 90.0, 76.0, 52.0, 39.0, 29.0, 14.0, 17.0, 13.0, 12.0, 9.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.46875, -15.94482421875, -15.4208984375, -14.89697265625, -14.373046875, -13.84912109375, -13.3251953125, -12.80126953125, -12.27734375, -11.75341796875, -11.2294921875, -10.70556640625, -10.181640625, -9.65771484375, -9.1337890625, -8.60986328125, -8.0859375, -7.56201171875, -7.0380859375, -6.51416015625, -5.990234375, -5.46630859375, -4.9423828125, -4.41845703125, -3.89453125, -3.37060546875, -2.8466796875, -2.32275390625, -1.798828125, -1.27490234375, -0.7509765625, -0.22705078125, 0.296875, 0.82080078125, 1.3447265625, 1.86865234375, 2.392578125, 2.91650390625, 3.4404296875, 3.96435546875, 4.48828125, 5.01220703125, 5.5361328125, 6.06005859375, 6.583984375, 7.10791015625, 7.6318359375, 8.15576171875, 8.6796875, 9.20361328125, 9.7275390625, 10.25146484375, 10.775390625, 11.29931640625, 11.8232421875, 12.34716796875, 12.87109375, 13.39501953125, 13.9189453125, 14.44287109375, 14.966796875, 15.49072265625, 16.0146484375, 16.53857421875, 17.0625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 6.0, 5.0, 14.0, 12.0, 27.0, 12.0, 12.0, 21.0, 22.0, 33.0, 26.0, 34.0, 31.0, 31.0, 38.0, 42.0, 52.0, 42.0, 44.0, 47.0, 28.0, 42.0, 39.0, 34.0, 41.0, 36.0, 32.0, 27.0, 36.0, 17.0, 18.0, 23.0, 16.0, 14.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 7.0, 0.0, 4.0, 3.0, 1.0, 2.0], "bins": [-13.171875, -12.8050537109375, -12.438232421875, -12.0714111328125, -11.70458984375, -11.3377685546875, -10.970947265625, -10.6041259765625, -10.2373046875, -9.8704833984375, -9.503662109375, -9.1368408203125, -8.77001953125, -8.4031982421875, -8.036376953125, -7.6695556640625, -7.302734375, -6.9359130859375, -6.569091796875, -6.2022705078125, -5.83544921875, -5.4686279296875, -5.101806640625, -4.7349853515625, -4.3681640625, -4.0013427734375, -3.634521484375, -3.2677001953125, -2.90087890625, -2.5340576171875, -2.167236328125, -1.8004150390625, -1.43359375, -1.0667724609375, -0.699951171875, -0.3331298828125, 0.03369140625, 0.4005126953125, 0.767333984375, 1.1341552734375, 1.5009765625, 1.8677978515625, 2.234619140625, 2.6014404296875, 2.96826171875, 3.3350830078125, 3.701904296875, 4.0687255859375, 4.435546875, 4.8023681640625, 5.169189453125, 5.5360107421875, 5.90283203125, 6.2696533203125, 6.636474609375, 7.0032958984375, 7.3701171875, 7.7369384765625, 8.103759765625, 8.4705810546875, 8.83740234375, 9.2042236328125, 9.571044921875, 9.9378662109375, 10.3046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 8.0, 2.0, 7.0, 14.0, 23.0, 24.0, 60.0, 82.0, 152.0, 227.0, 411.0, 869.0, 2541.0, 10480.0, 59559.0, 538587.0, 378649.0, 44848.0, 8155.0, 2113.0, 802.0, 377.0, 214.0, 109.0, 89.0, 47.0, 27.0, 22.0, 10.0, 15.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6640625, -13.2490234375, -12.833984375, -12.4189453125, -12.00390625, -11.5888671875, -11.173828125, -10.7587890625, -10.34375, -9.9287109375, -9.513671875, -9.0986328125, -8.68359375, -8.2685546875, -7.853515625, -7.4384765625, -7.0234375, -6.6083984375, -6.193359375, -5.7783203125, -5.36328125, -4.9482421875, -4.533203125, -4.1181640625, -3.703125, -3.2880859375, -2.873046875, -2.4580078125, -2.04296875, -1.6279296875, -1.212890625, -0.7978515625, -0.3828125, 0.0322265625, 0.447265625, 0.8623046875, 1.27734375, 1.6923828125, 2.107421875, 2.5224609375, 2.9375, 3.3525390625, 3.767578125, 4.1826171875, 4.59765625, 5.0126953125, 5.427734375, 5.8427734375, 6.2578125, 6.6728515625, 7.087890625, 7.5029296875, 7.91796875, 8.3330078125, 8.748046875, 9.1630859375, 9.578125, 9.9931640625, 10.408203125, 10.8232421875, 11.23828125, 11.6533203125, 12.068359375, 12.4833984375, 12.8984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 10.0, 13.0, 9.0, 18.0, 18.0, 22.0, 29.0, 39.0, 96.0, 195.0, 223.0, 98.0, 33.0, 40.0, 23.0, 27.0, 21.0, 11.0, 7.0, 5.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001407623291015625, -0.0013535618782043457, -0.0012995004653930664, -0.0012454390525817871, -0.0011913776397705078, -0.0011373162269592285, -0.0010832548141479492, -0.00102919340133667, -0.0009751319885253906, -0.0009210705757141113, -0.000867009162902832, -0.0008129477500915527, -0.0007588863372802734, -0.0007048249244689941, -0.0006507635116577148, -0.0005967020988464355, -0.0005426406860351562, -0.000488579273223877, -0.00043451786041259766, -0.00038045644760131836, -0.00032639503479003906, -0.00027233362197875977, -0.00021827220916748047, -0.00016421079635620117, -0.00011014938354492188, -5.608797073364258e-05, -2.0265579223632812e-06, 5.2034854888916016e-05, 0.00010609626770019531, 0.0001601576805114746, 0.0002142190933227539, 0.0002682805061340332, 0.0003223419189453125, 0.0003764033317565918, 0.0004304647445678711, 0.0004845261573791504, 0.0005385875701904297, 0.000592648983001709, 0.0006467103958129883, 0.0007007718086242676, 0.0007548332214355469, 0.0008088946342468262, 0.0008629560470581055, 0.0009170174598693848, 0.0009710788726806641, 0.0010251402854919434, 0.0010792016983032227, 0.001133263111114502, 0.0011873245239257812, 0.0012413859367370605, 0.0012954473495483398, 0.0013495087623596191, 0.0014035701751708984, 0.0014576315879821777, 0.001511693000793457, 0.0015657544136047363, 0.0016198158264160156, 0.001673877239227295, 0.0017279386520385742, 0.0017820000648498535, 0.0018360614776611328, 0.0018901228904724121, 0.0019441843032836914, 0.0019982457160949707, 0.00205230712890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 11.0, 11.0, 13.0, 25.0, 38.0, 68.0, 106.0, 181.0, 370.0, 805.0, 2653.0, 20759.0, 635327.0, 370033.0, 14534.0, 2191.0, 685.0, 351.0, 178.0, 74.0, 60.0, 31.0, 20.0, 15.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.953125, -17.170166015625, -16.38720703125, -15.604248046875, -14.8212890625, -14.038330078125, -13.25537109375, -12.472412109375, -11.689453125, -10.906494140625, -10.12353515625, -9.340576171875, -8.5576171875, -7.774658203125, -6.99169921875, -6.208740234375, -5.42578125, -4.642822265625, -3.85986328125, -3.076904296875, -2.2939453125, -1.510986328125, -0.72802734375, 0.054931640625, 0.837890625, 1.620849609375, 2.40380859375, 3.186767578125, 3.9697265625, 4.752685546875, 5.53564453125, 6.318603515625, 7.1015625, 7.884521484375, 8.66748046875, 9.450439453125, 10.2333984375, 11.016357421875, 11.79931640625, 12.582275390625, 13.365234375, 14.148193359375, 14.93115234375, 15.714111328125, 16.4970703125, 17.280029296875, 18.06298828125, 18.845947265625, 19.62890625, 20.411865234375, 21.19482421875, 21.977783203125, 22.7607421875, 23.543701171875, 24.32666015625, 25.109619140625, 25.892578125, 26.675537109375, 27.45849609375, 28.241455078125, 29.0244140625, 29.807373046875, 30.59033203125, 31.373291015625, 32.15625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 6.0, 4.0, 11.0, 9.0, 16.0, 17.0, 24.0, 29.0, 34.0, 50.0, 62.0, 84.0, 109.0, 105.0, 89.0, 61.0, 65.0, 39.0, 33.0, 26.0, 23.0, 15.0, 14.0, 22.0, 9.0, 5.0, 6.0, 2.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.5625, -7.33514404296875, -7.1077880859375, -6.88043212890625, -6.653076171875, -6.42572021484375, -6.1983642578125, -5.97100830078125, -5.74365234375, -5.51629638671875, -5.2889404296875, -5.06158447265625, -4.834228515625, -4.60687255859375, -4.3795166015625, -4.15216064453125, -3.9248046875, -3.69744873046875, -3.4700927734375, -3.24273681640625, -3.015380859375, -2.78802490234375, -2.5606689453125, -2.33331298828125, -2.10595703125, -1.87860107421875, -1.6512451171875, -1.42388916015625, -1.196533203125, -0.96917724609375, -0.7418212890625, -0.51446533203125, -0.287109375, -0.05975341796875, 0.1676025390625, 0.39495849609375, 0.622314453125, 0.84967041015625, 1.0770263671875, 1.30438232421875, 1.53173828125, 1.75909423828125, 1.9864501953125, 2.21380615234375, 2.441162109375, 2.66851806640625, 2.8958740234375, 3.12322998046875, 3.3505859375, 3.57794189453125, 3.8052978515625, 4.03265380859375, 4.260009765625, 4.48736572265625, 4.7147216796875, 4.94207763671875, 5.16943359375, 5.39678955078125, 5.6241455078125, 5.85150146484375, 6.078857421875, 6.30621337890625, 6.5335693359375, 6.76092529296875, 6.98828125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 21.0, 49.0, 99.0, 147.0, 210.0, 186.0, 143.0, 63.0, 34.0, 23.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.17317199707031, -59.779273986816406, -54.3853759765625, -48.99147415161133, -43.59757614135742, -38.203678131103516, -32.809776306152344, -27.415878295898438, -22.02198028564453, -16.628082275390625, -11.234182357788086, -5.840282440185547, -0.4463844299316406, 4.947513580322266, 10.341415405273438, 15.735313415527344, 21.12921142578125, 26.523109436035156, 31.917009353637695, 37.310909271240234, 42.70480728149414, 48.09870529174805, 53.49260711669922, 58.886505126953125, 64.28040313720703, 69.67430114746094, 75.06819915771484, 80.46209716796875, 85.85600280761719, 91.24989318847656, 96.643798828125, 102.0376968383789, 107.43157958984375, 112.82547760009766, 118.21937561035156, 123.61328125, 129.00717163085938, 134.4010772705078, 139.79498291015625, 145.18887329101562, 150.582763671875, 155.97666931152344, 161.3705596923828, 166.76446533203125, 172.15835571289062, 177.55226135253906, 182.9461669921875, 188.34005737304688, 193.7339630126953, 199.12786865234375, 204.52175903320312, 209.91566467285156, 215.30955505371094, 220.70346069335938, 226.09735107421875, 231.4912567138672, 236.88516235351562, 242.27906799316406, 247.67295837402344, 253.06686401367188, 258.46075439453125, 263.8546447753906, 269.2485656738281, 274.6424560546875, 280.0363464355469]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 9.0, 14.0, 8.0, 12.0, 14.0, 11.0, 14.0, 16.0, 16.0, 26.0, 27.0, 23.0, 31.0, 39.0, 35.0, 44.0, 38.0, 22.0, 60.0, 41.0, 41.0, 44.0, 46.0, 38.0, 38.0, 37.0, 28.0, 37.0, 28.0, 35.0, 24.0, 25.0, 13.0, 8.0, 11.0, 14.0, 7.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.59772491455078, -58.66156005859375, -56.72539520263672, -54.78923034667969, -52.853065490722656, -50.916900634765625, -48.98073959350586, -47.04457473754883, -45.1084098815918, -43.172245025634766, -41.236080169677734, -39.2999153137207, -37.36375427246094, -35.427589416503906, -33.491424560546875, -31.555259704589844, -29.619094848632812, -27.68292999267578, -25.74676513671875, -23.81060218811035, -21.87443733215332, -19.93827247619629, -18.00210952758789, -16.06594467163086, -14.129779815673828, -12.193614959716797, -10.257451057434082, -8.321287155151367, -6.385122299194336, -4.448957443237305, -2.51279354095459, -0.576629638671875, 1.3595314025878906, 3.2956957817077637, 5.231860160827637, 7.16802453994751, 9.104188919067383, 11.040353775024414, 12.976517677307129, 14.912681579589844, 16.848846435546875, 18.785011291503906, 20.721176147460938, 22.657339096069336, 24.593503952026367, 26.5296688079834, 28.465831756591797, 30.401996612548828, 32.33816146850586, 34.27432632446289, 36.21049118041992, 38.14665603637695, 40.08281707763672, 42.01898193359375, 43.95514678955078, 45.89131164550781, 47.827476501464844, 49.763641357421875, 51.699806213378906, 53.63597106933594, 55.57213592529297, 57.50830078125, 59.444461822509766, 61.3806266784668, 63.31679153442383]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 2.0, 7.0, 8.0, 21.0, 16.0, 22.0, 34.0, 38.0, 83.0, 114.0, 224.0, 450.0, 1096.0, 3001.0, 9471.0, 40717.0, 536180.0, 3496137.0, 83700.0, 15684.0, 4394.0, 1508.0, 662.0, 281.0, 167.0, 86.0, 54.0, 39.0, 21.0, 21.0, 7.0, 9.0, 4.0, 3.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.59375, -35.33984375, -34.0859375, -32.83203125, -31.578125, -30.32421875, -29.0703125, -27.81640625, -26.5625, -25.30859375, -24.0546875, -22.80078125, -21.546875, -20.29296875, -19.0390625, -17.78515625, -16.53125, -15.27734375, -14.0234375, -12.76953125, -11.515625, -10.26171875, -9.0078125, -7.75390625, -6.5, -5.24609375, -3.9921875, -2.73828125, -1.484375, -0.23046875, 1.0234375, 2.27734375, 3.53125, 4.78515625, 6.0390625, 7.29296875, 8.546875, 9.80078125, 11.0546875, 12.30859375, 13.5625, 14.81640625, 16.0703125, 17.32421875, 18.578125, 19.83203125, 21.0859375, 22.33984375, 23.59375, 24.84765625, 26.1015625, 27.35546875, 28.609375, 29.86328125, 31.1171875, 32.37109375, 33.625, 34.87890625, 36.1328125, 37.38671875, 38.640625, 39.89453125, 41.1484375, 42.40234375, 43.65625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 5.0, 13.0, 13.0, 14.0, 17.0, 19.0, 18.0, 31.0, 29.0, 33.0, 34.0, 40.0, 33.0, 49.0, 58.0, 57.0, 49.0, 39.0, 38.0, 40.0, 51.0, 43.0, 31.0, 37.0, 44.0, 20.0, 20.0, 21.0, 22.0, 16.0, 11.0, 14.0, 7.0, 8.0, 2.0, 6.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.921875, -2.82684326171875, -2.7318115234375, -2.63677978515625, -2.541748046875, -2.44671630859375, -2.3516845703125, -2.25665283203125, -2.16162109375, -2.06658935546875, -1.9715576171875, -1.87652587890625, -1.781494140625, -1.68646240234375, -1.5914306640625, -1.49639892578125, -1.4013671875, -1.30633544921875, -1.2113037109375, -1.11627197265625, -1.021240234375, -0.92620849609375, -0.8311767578125, -0.73614501953125, -0.64111328125, -0.54608154296875, -0.4510498046875, -0.35601806640625, -0.260986328125, -0.16595458984375, -0.0709228515625, 0.02410888671875, 0.119140625, 0.21417236328125, 0.3092041015625, 0.40423583984375, 0.499267578125, 0.59429931640625, 0.6893310546875, 0.78436279296875, 0.87939453125, 0.97442626953125, 1.0694580078125, 1.16448974609375, 1.259521484375, 1.35455322265625, 1.4495849609375, 1.54461669921875, 1.6396484375, 1.73468017578125, 1.8297119140625, 1.92474365234375, 2.019775390625, 2.11480712890625, 2.2098388671875, 2.30487060546875, 2.39990234375, 2.49493408203125, 2.5899658203125, 2.68499755859375, 2.780029296875, 2.87506103515625, 2.9700927734375, 3.06512451171875, 3.16015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 9.0, 8.0, 20.0, 18.0, 22.0, 28.0, 30.0, 44.0, 44.0, 59.0, 71.0, 126.0, 164.0, 262.0, 557.0, 1348.0, 5035.0, 28460.0, 387352.0, 3639693.0, 112501.0, 13299.0, 2862.0, 934.0, 427.0, 238.0, 118.0, 103.0, 80.0, 81.0, 47.0, 38.0, 31.0, 37.0, 27.0, 22.0, 15.0, 11.0, 16.0, 7.0, 6.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.1875, -31.05029296875, -29.9130859375, -28.77587890625, -27.638671875, -26.50146484375, -25.3642578125, -24.22705078125, -23.08984375, -21.95263671875, -20.8154296875, -19.67822265625, -18.541015625, -17.40380859375, -16.2666015625, -15.12939453125, -13.9921875, -12.85498046875, -11.7177734375, -10.58056640625, -9.443359375, -8.30615234375, -7.1689453125, -6.03173828125, -4.89453125, -3.75732421875, -2.6201171875, -1.48291015625, -0.345703125, 0.79150390625, 1.9287109375, 3.06591796875, 4.203125, 5.34033203125, 6.4775390625, 7.61474609375, 8.751953125, 9.88916015625, 11.0263671875, 12.16357421875, 13.30078125, 14.43798828125, 15.5751953125, 16.71240234375, 17.849609375, 18.98681640625, 20.1240234375, 21.26123046875, 22.3984375, 23.53564453125, 24.6728515625, 25.81005859375, 26.947265625, 28.08447265625, 29.2216796875, 30.35888671875, 31.49609375, 32.63330078125, 33.7705078125, 34.90771484375, 36.044921875, 37.18212890625, 38.3193359375, 39.45654296875, 40.59375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 8.0, 24.0, 19.0, 60.0, 92.0, 212.0, 520.0, 1956.0, 696.0, 250.0, 102.0, 58.0, 33.0, 11.0, 13.0, 9.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.637939453125, -6.21337890625, -5.788818359375, -5.3642578125, -4.939697265625, -4.51513671875, -4.090576171875, -3.666015625, -3.241455078125, -2.81689453125, -2.392333984375, -1.9677734375, -1.543212890625, -1.11865234375, -0.694091796875, -0.26953125, 0.155029296875, 0.57958984375, 1.004150390625, 1.4287109375, 1.853271484375, 2.27783203125, 2.702392578125, 3.126953125, 3.551513671875, 3.97607421875, 4.400634765625, 4.8251953125, 5.249755859375, 5.67431640625, 6.098876953125, 6.5234375, 6.947998046875, 7.37255859375, 7.797119140625, 8.2216796875, 8.646240234375, 9.07080078125, 9.495361328125, 9.919921875, 10.344482421875, 10.76904296875, 11.193603515625, 11.6181640625, 12.042724609375, 12.46728515625, 12.891845703125, 13.31640625, 13.740966796875, 14.16552734375, 14.590087890625, 15.0146484375, 15.439208984375, 15.86376953125, 16.288330078125, 16.712890625, 17.137451171875, 17.56201171875, 17.986572265625, 18.4111328125, 18.835693359375, 19.26025390625, 19.684814453125, 20.109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 15.0, 40.0, 71.0, 177.0, 221.0, 189.0, 145.0, 87.0, 27.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.99659729003906, -132.76165771484375, -129.52670288085938, -126.29175567626953, -123.05680847167969, -119.82186126708984, -116.5869140625, -113.35196685791016, -110.11701965332031, -106.88207244873047, -103.64712524414062, -100.41217803955078, -97.17723083496094, -93.9422836303711, -90.70733642578125, -87.4723892211914, -84.23744201660156, -81.00249481201172, -77.76754760742188, -74.53260040283203, -71.29765319824219, -68.06270599365234, -64.8277587890625, -61.592811584472656, -58.35786437988281, -55.12291717529297, -51.887969970703125, -48.65302276611328, -45.41807556152344, -42.183128356933594, -38.94818115234375, -35.713233947753906, -32.47828674316406, -29.24333953857422, -26.008392333984375, -22.77344512939453, -19.538497924804688, -16.303550720214844, -13.068603515625, -9.833656311035156, -6.5987091064453125, -3.3637619018554688, -0.128814697265625, 3.1061325073242188, 6.3410797119140625, 9.576026916503906, 12.81097412109375, 16.045921325683594, 19.280868530273438, 22.51581573486328, 25.750762939453125, 28.98571014404297, 32.22065734863281, 35.455604553222656, 38.6905517578125, 41.925498962402344, 45.16044616699219, 48.39539337158203, 51.630340576171875, 54.86528778076172, 58.10023498535156, 61.335182189941406, 64.57012939453125, 67.8050765991211, 71.04002380371094]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 6.0, 9.0, 5.0, 4.0, 8.0, 16.0, 15.0, 17.0, 22.0, 30.0, 34.0, 29.0, 40.0, 49.0, 45.0, 49.0, 61.0, 54.0, 42.0, 51.0, 36.0, 43.0, 48.0, 45.0, 44.0, 31.0, 31.0, 16.0, 24.0, 18.0, 13.0, 11.0, 11.0, 12.0, 7.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-36.22332000732422, -35.2440071105957, -34.26469421386719, -33.28538131713867, -32.306068420410156, -31.32675552368164, -30.347442626953125, -29.36812973022461, -28.388816833496094, -27.409503936767578, -26.430191040039062, -25.450878143310547, -24.47156524658203, -23.492252349853516, -22.512939453125, -21.533626556396484, -20.5543155670166, -19.575002670288086, -18.59568977355957, -17.616376876831055, -16.63706398010254, -15.657751083374023, -14.678439140319824, -13.699126243591309, -12.719813346862793, -11.740500450134277, -10.761187553405762, -9.781875610351562, -8.802562713623047, -7.823249340057373, -6.843936920166016, -5.8646240234375, -4.885311126708984, -3.9059982299804688, -2.9266855716705322, -1.9473729133605957, -0.9680600166320801, 0.011252880096435547, 0.990565299987793, 1.9698781967163086, 2.949191093444824, 3.92850399017334, 4.9078168869018555, 5.887129306793213, 6.8664422035217285, 7.845755100250244, 8.825067520141602, 9.804380416870117, 10.783693313598633, 11.763006210327148, 12.742319107055664, 13.72163200378418, 14.700944900512695, 15.680257797241211, 16.659568786621094, 17.63888168334961, 18.618194580078125, 19.59750747680664, 20.576820373535156, 21.556133270263672, 22.535446166992188, 23.514759063720703, 24.49407196044922, 25.473384857177734, 26.45269775390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 9.0, 13.0, 20.0, 30.0, 45.0, 46.0, 65.0, 128.0, 160.0, 260.0, 404.0, 806.0, 1502.0, 3110.0, 7103.0, 16944.0, 42840.0, 123992.0, 509438.0, 231819.0, 65666.0, 24904.0, 10255.0, 4374.0, 2079.0, 1015.0, 568.0, 336.0, 215.0, 146.0, 81.0, 54.0, 40.0, 19.0, 18.0, 15.0, 13.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.777099609375, -15.16357421875, -14.550048828125, -13.9365234375, -13.322998046875, -12.70947265625, -12.095947265625, -11.482421875, -10.868896484375, -10.25537109375, -9.641845703125, -9.0283203125, -8.414794921875, -7.80126953125, -7.187744140625, -6.57421875, -5.960693359375, -5.34716796875, -4.733642578125, -4.1201171875, -3.506591796875, -2.89306640625, -2.279541015625, -1.666015625, -1.052490234375, -0.43896484375, 0.174560546875, 0.7880859375, 1.401611328125, 2.01513671875, 2.628662109375, 3.2421875, 3.855712890625, 4.46923828125, 5.082763671875, 5.6962890625, 6.309814453125, 6.92333984375, 7.536865234375, 8.150390625, 8.763916015625, 9.37744140625, 9.990966796875, 10.6044921875, 11.218017578125, 11.83154296875, 12.445068359375, 13.05859375, 13.672119140625, 14.28564453125, 14.899169921875, 15.5126953125, 16.126220703125, 16.73974609375, 17.353271484375, 17.966796875, 18.580322265625, 19.19384765625, 19.807373046875, 20.4208984375, 21.034423828125, 21.64794921875, 22.261474609375, 22.875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 18.0, 20.0, 9.0, 16.0, 33.0, 28.0, 22.0, 21.0, 38.0, 30.0, 40.0, 44.0, 43.0, 46.0, 54.0, 44.0, 49.0, 49.0, 42.0, 49.0, 37.0, 39.0, 40.0, 30.0, 31.0, 18.0, 17.0, 24.0, 15.0, 8.0, 6.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.9296875, -2.8299560546875, -2.730224609375, -2.6304931640625, -2.53076171875, -2.4310302734375, -2.331298828125, -2.2315673828125, -2.1318359375, -2.0321044921875, -1.932373046875, -1.8326416015625, -1.73291015625, -1.6331787109375, -1.533447265625, -1.4337158203125, -1.333984375, -1.2342529296875, -1.134521484375, -1.0347900390625, -0.93505859375, -0.8353271484375, -0.735595703125, -0.6358642578125, -0.5361328125, -0.4364013671875, -0.336669921875, -0.2369384765625, -0.13720703125, -0.0374755859375, 0.062255859375, 0.1619873046875, 0.26171875, 0.3614501953125, 0.461181640625, 0.5609130859375, 0.66064453125, 0.7603759765625, 0.860107421875, 0.9598388671875, 1.0595703125, 1.1593017578125, 1.259033203125, 1.3587646484375, 1.45849609375, 1.5582275390625, 1.657958984375, 1.7576904296875, 1.857421875, 1.9571533203125, 2.056884765625, 2.1566162109375, 2.25634765625, 2.3560791015625, 2.455810546875, 2.5555419921875, 2.6552734375, 2.7550048828125, 2.854736328125, 2.9544677734375, 3.05419921875, 3.1539306640625, 3.253662109375, 3.3533935546875, 3.453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 10.0, 13.0, 13.0, 15.0, 25.0, 24.0, 25.0, 47.0, 83.0, 121.0, 195.0, 356.0, 643.0, 1302.0, 2881.0, 7113.0, 17785.0, 46996.0, 143077.0, 499383.0, 222601.0, 64866.0, 24185.0, 9365.0, 3835.0, 1671.0, 792.0, 395.0, 237.0, 150.0, 100.0, 60.0, 54.0, 33.0, 33.0, 15.0, 16.0, 13.0, 3.0, 4.0, 5.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.734375, -14.296630859375, -13.85888671875, -13.421142578125, -12.9833984375, -12.545654296875, -12.10791015625, -11.670166015625, -11.232421875, -10.794677734375, -10.35693359375, -9.919189453125, -9.4814453125, -9.043701171875, -8.60595703125, -8.168212890625, -7.73046875, -7.292724609375, -6.85498046875, -6.417236328125, -5.9794921875, -5.541748046875, -5.10400390625, -4.666259765625, -4.228515625, -3.790771484375, -3.35302734375, -2.915283203125, -2.4775390625, -2.039794921875, -1.60205078125, -1.164306640625, -0.7265625, -0.288818359375, 0.14892578125, 0.586669921875, 1.0244140625, 1.462158203125, 1.89990234375, 2.337646484375, 2.775390625, 3.213134765625, 3.65087890625, 4.088623046875, 4.5263671875, 4.964111328125, 5.40185546875, 5.839599609375, 6.27734375, 6.715087890625, 7.15283203125, 7.590576171875, 8.0283203125, 8.466064453125, 8.90380859375, 9.341552734375, 9.779296875, 10.217041015625, 10.65478515625, 11.092529296875, 11.5302734375, 11.968017578125, 12.40576171875, 12.843505859375, 13.28125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 8.0, 12.0, 8.0, 9.0, 10.0, 11.0, 12.0, 11.0, 22.0, 28.0, 44.0, 24.0, 44.0, 37.0, 46.0, 38.0, 41.0, 50.0, 57.0, 36.0, 44.0, 35.0, 48.0, 39.0, 41.0, 31.0, 35.0, 30.0, 27.0, 17.0, 22.0, 23.0, 15.0, 16.0, 8.0, 4.0, 7.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.8682861328125, -12.455322265625, -12.0423583984375, -11.62939453125, -11.2164306640625, -10.803466796875, -10.3905029296875, -9.9775390625, -9.5645751953125, -9.151611328125, -8.7386474609375, -8.32568359375, -7.9127197265625, -7.499755859375, -7.0867919921875, -6.673828125, -6.2608642578125, -5.847900390625, -5.4349365234375, -5.02197265625, -4.6090087890625, -4.196044921875, -3.7830810546875, -3.3701171875, -2.9571533203125, -2.544189453125, -2.1312255859375, -1.71826171875, -1.3052978515625, -0.892333984375, -0.4793701171875, -0.06640625, 0.3465576171875, 0.759521484375, 1.1724853515625, 1.58544921875, 1.9984130859375, 2.411376953125, 2.8243408203125, 3.2373046875, 3.6502685546875, 4.063232421875, 4.4761962890625, 4.88916015625, 5.3021240234375, 5.715087890625, 6.1280517578125, 6.541015625, 6.9539794921875, 7.366943359375, 7.7799072265625, 8.19287109375, 8.6058349609375, 9.018798828125, 9.4317626953125, 9.8447265625, 10.2576904296875, 10.670654296875, 11.0836181640625, 11.49658203125, 11.9095458984375, 12.322509765625, 12.7354736328125, 13.1484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 10.0, 12.0, 30.0, 38.0, 63.0, 85.0, 145.0, 367.0, 869.0, 3126.0, 14965.0, 214076.0, 765664.0, 40579.0, 5883.0, 1553.0, 573.0, 231.0, 110.0, 62.0, 42.0, 30.0, 15.0, 11.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.89013671875, -15.3271484375, -14.76416015625, -14.201171875, -13.63818359375, -13.0751953125, -12.51220703125, -11.94921875, -11.38623046875, -10.8232421875, -10.26025390625, -9.697265625, -9.13427734375, -8.5712890625, -8.00830078125, -7.4453125, -6.88232421875, -6.3193359375, -5.75634765625, -5.193359375, -4.63037109375, -4.0673828125, -3.50439453125, -2.94140625, -2.37841796875, -1.8154296875, -1.25244140625, -0.689453125, -0.12646484375, 0.4365234375, 0.99951171875, 1.5625, 2.12548828125, 2.6884765625, 3.25146484375, 3.814453125, 4.37744140625, 4.9404296875, 5.50341796875, 6.06640625, 6.62939453125, 7.1923828125, 7.75537109375, 8.318359375, 8.88134765625, 9.4443359375, 10.00732421875, 10.5703125, 11.13330078125, 11.6962890625, 12.25927734375, 12.822265625, 13.38525390625, 13.9482421875, 14.51123046875, 15.07421875, 15.63720703125, 16.2001953125, 16.76318359375, 17.326171875, 17.88916015625, 18.4521484375, 19.01513671875, 19.578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 9.0, 3.0, 5.0, 5.0, 6.0, 11.0, 9.0, 10.0, 25.0, 28.0, 28.0, 54.0, 103.0, 170.0, 204.0, 118.0, 66.0, 29.0, 20.0, 17.0, 17.0, 9.0, 11.0, 10.0, 7.0, 10.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.001369476318359375, -0.001326829195022583, -0.001284182071685791, -0.001241534948348999, -0.001198887825012207, -0.001156240701675415, -0.001113593578338623, -0.001070946455001831, -0.001028299331665039, -0.000985652208328247, -0.0009430050849914551, -0.0009003579616546631, -0.0008577108383178711, -0.0008150637149810791, -0.0007724165916442871, -0.0007297694683074951, -0.0006871223449707031, -0.0006444752216339111, -0.0006018280982971191, -0.0005591809749603271, -0.0005165338516235352, -0.00047388672828674316, -0.00043123960494995117, -0.0003885924816131592, -0.0003459453582763672, -0.0003032982349395752, -0.0002606511116027832, -0.0002180039882659912, -0.00017535686492919922, -0.00013270974159240723, -9.006261825561523e-05, -4.741549491882324e-05, -4.76837158203125e-06, 3.787875175476074e-05, 8.052587509155273e-05, 0.00012317299842834473, 0.00016582012176513672, 0.0002084672451019287, 0.0002511143684387207, 0.0002937614917755127, 0.0003364086151123047, 0.0003790557384490967, 0.00042170286178588867, 0.00046434998512268066, 0.0005069971084594727, 0.0005496442317962646, 0.0005922913551330566, 0.0006349384784698486, 0.0006775856018066406, 0.0007202327251434326, 0.0007628798484802246, 0.0008055269718170166, 0.0008481740951538086, 0.0008908212184906006, 0.0009334683418273926, 0.0009761154651641846, 0.0010187625885009766, 0.0010614097118377686, 0.0011040568351745605, 0.0011467039585113525, 0.0011893510818481445, 0.0012319982051849365, 0.0012746453285217285, 0.0013172924518585205, 0.0013599395751953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 13.0, 7.0, 6.0, 15.0, 24.0, 30.0, 34.0, 59.0, 75.0, 125.0, 189.0, 299.0, 531.0, 781.0, 1374.0, 2482.0, 4879.0, 10943.0, 32042.0, 162570.0, 629396.0, 150680.0, 30768.0, 10625.0, 4721.0, 2405.0, 1309.0, 796.0, 499.0, 281.0, 201.0, 117.0, 89.0, 51.0, 40.0, 18.0, 17.0, 14.0, 14.0, 9.0, 12.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.78125, -9.449462890625, -9.11767578125, -8.785888671875, -8.4541015625, -8.122314453125, -7.79052734375, -7.458740234375, -7.126953125, -6.795166015625, -6.46337890625, -6.131591796875, -5.7998046875, -5.468017578125, -5.13623046875, -4.804443359375, -4.47265625, -4.140869140625, -3.80908203125, -3.477294921875, -3.1455078125, -2.813720703125, -2.48193359375, -2.150146484375, -1.818359375, -1.486572265625, -1.15478515625, -0.822998046875, -0.4912109375, -0.159423828125, 0.17236328125, 0.504150390625, 0.8359375, 1.167724609375, 1.49951171875, 1.831298828125, 2.1630859375, 2.494873046875, 2.82666015625, 3.158447265625, 3.490234375, 3.822021484375, 4.15380859375, 4.485595703125, 4.8173828125, 5.149169921875, 5.48095703125, 5.812744140625, 6.14453125, 6.476318359375, 6.80810546875, 7.139892578125, 7.4716796875, 7.803466796875, 8.13525390625, 8.467041015625, 8.798828125, 9.130615234375, 9.46240234375, 9.794189453125, 10.1259765625, 10.457763671875, 10.78955078125, 11.121337890625, 11.453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 8.0, 13.0, 11.0, 19.0, 40.0, 50.0, 71.0, 67.0, 112.0, 150.0, 125.0, 85.0, 67.0, 41.0, 26.0, 22.0, 18.0, 16.0, 13.0, 7.0, 4.0, 6.0, 3.0, 7.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.9298095703125, -9.625244140625, -9.3206787109375, -9.01611328125, -8.7115478515625, -8.406982421875, -8.1024169921875, -7.7978515625, -7.4932861328125, -7.188720703125, -6.8841552734375, -6.57958984375, -6.2750244140625, -5.970458984375, -5.6658935546875, -5.361328125, -5.0567626953125, -4.752197265625, -4.4476318359375, -4.14306640625, -3.8385009765625, -3.533935546875, -3.2293701171875, -2.9248046875, -2.6202392578125, -2.315673828125, -2.0111083984375, -1.70654296875, -1.4019775390625, -1.097412109375, -0.7928466796875, -0.48828125, -0.1837158203125, 0.120849609375, 0.4254150390625, 0.72998046875, 1.0345458984375, 1.339111328125, 1.6436767578125, 1.9482421875, 2.2528076171875, 2.557373046875, 2.8619384765625, 3.16650390625, 3.4710693359375, 3.775634765625, 4.0802001953125, 4.384765625, 4.6893310546875, 4.993896484375, 5.2984619140625, 5.60302734375, 5.9075927734375, 6.212158203125, 6.5167236328125, 6.8212890625, 7.1258544921875, 7.430419921875, 7.7349853515625, 8.03955078125, 8.3441162109375, 8.648681640625, 8.9532470703125, 9.2578125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 20.0, 19.0, 46.0, 102.0, 139.0, 184.0, 170.0, 125.0, 94.0, 56.0, 29.0, 17.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.27543640136719, -74.3579330444336, -69.4404296875, -64.52291870117188, -59.60541534423828, -54.68791198730469, -49.77040481567383, -44.85289764404297, -39.935394287109375, -35.01789093017578, -30.100383758544922, -25.182878494262695, -20.26537322998047, -15.347867965698242, -10.430362701416016, -5.512855529785156, -0.5953521728515625, 4.322153091430664, 9.23965835571289, 14.157163619995117, 19.074668884277344, 23.99217414855957, 28.909679412841797, 33.827186584472656, 38.74468994140625, 43.662193298339844, 48.5797004699707, 53.49720764160156, 58.414710998535156, 63.33221435546875, 68.24972534179688, 73.16722869873047, 78.08473205566406, 83.00223541259766, 87.91973876953125, 92.83724975585938, 97.75475311279297, 102.67225646972656, 107.58976745605469, 112.50727081298828, 117.42477416992188, 122.34227752685547, 127.25978088378906, 132.1772918701172, 137.09478759765625, 142.01229858398438, 146.9298095703125, 151.84732055664062, 156.7648162841797, 161.6823272705078, 166.59982299804688, 171.517333984375, 176.43484497070312, 181.3523406982422, 186.2698516845703, 191.18734741210938, 196.1048583984375, 201.02236938476562, 205.9398651123047, 210.8573760986328, 215.77487182617188, 220.6923828125, 225.60989379882812, 230.52740478515625, 235.4449005126953]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 8.0, 8.0, 11.0, 22.0, 13.0, 18.0, 23.0, 38.0, 29.0, 29.0, 42.0, 42.0, 46.0, 48.0, 33.0, 34.0, 56.0, 45.0, 41.0, 36.0, 36.0, 42.0, 39.0, 39.0, 39.0, 25.0, 31.0, 18.0, 19.0, 12.0, 13.0, 12.0, 3.0, 6.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-65.46266174316406, -63.459285736083984, -61.455909729003906, -59.45252990722656, -57.449153900146484, -55.445777893066406, -53.44239807128906, -51.439022064208984, -49.435646057128906, -47.43227005004883, -45.42889404296875, -43.425514221191406, -41.42213821411133, -39.41876220703125, -37.415382385253906, -35.41200637817383, -33.40863037109375, -31.405254364013672, -29.40187644958496, -27.39849853515625, -25.395122528076172, -23.391746520996094, -21.388368606567383, -19.384990692138672, -17.381614685058594, -15.3782377243042, -13.374860763549805, -11.37148380279541, -9.368106842041016, -7.364729881286621, -5.361352920532227, -3.357975959777832, -1.3546066284179688, 0.6487703323364258, 2.6521472930908203, 4.655524253845215, 6.658901214599609, 8.662278175354004, 10.665655136108398, 12.669032096862793, 14.672409057617188, 16.675785064697266, 18.679162979125977, 20.682540893554688, 22.685916900634766, 24.689292907714844, 26.692670822143555, 28.696048736572266, 30.699424743652344, 32.70280075073242, 34.7061767578125, 36.709556579589844, 38.71293258666992, 40.71630859375, 42.719688415527344, 44.72306442260742, 46.7264404296875, 48.72981643676758, 50.733192443847656, 52.736572265625, 54.73994827270508, 56.743324279785156, 58.7467041015625, 60.75008010864258, 62.753456115722656]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 10.0, 7.0, 13.0, 25.0, 16.0, 32.0, 24.0, 43.0, 68.0, 97.0, 147.0, 175.0, 278.0, 405.0, 614.0, 980.0, 1613.0, 2821.0, 5023.0, 9800.0, 21426.0, 55353.0, 210935.0, 3191116.0, 535196.0, 94970.0, 32388.0, 14277.0, 7006.0, 3759.0, 2108.0, 1240.0, 759.0, 497.0, 333.0, 211.0, 156.0, 108.0, 80.0, 44.0, 37.0, 22.0, 17.0, 12.0, 14.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-23.3125, -22.621337890625, -21.93017578125, -21.239013671875, -20.5478515625, -19.856689453125, -19.16552734375, -18.474365234375, -17.783203125, -17.092041015625, -16.40087890625, -15.709716796875, -15.0185546875, -14.327392578125, -13.63623046875, -12.945068359375, -12.25390625, -11.562744140625, -10.87158203125, -10.180419921875, -9.4892578125, -8.798095703125, -8.10693359375, -7.415771484375, -6.724609375, -6.033447265625, -5.34228515625, -4.651123046875, -3.9599609375, -3.268798828125, -2.57763671875, -1.886474609375, -1.1953125, -0.504150390625, 0.18701171875, 0.878173828125, 1.5693359375, 2.260498046875, 2.95166015625, 3.642822265625, 4.333984375, 5.025146484375, 5.71630859375, 6.407470703125, 7.0986328125, 7.789794921875, 8.48095703125, 9.172119140625, 9.86328125, 10.554443359375, 11.24560546875, 11.936767578125, 12.6279296875, 13.319091796875, 14.01025390625, 14.701416015625, 15.392578125, 16.083740234375, 16.77490234375, 17.466064453125, 18.1572265625, 18.848388671875, 19.53955078125, 20.230712890625, 20.921875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 12.0, 7.0, 13.0, 18.0, 14.0, 17.0, 27.0, 25.0, 22.0, 43.0, 36.0, 48.0, 38.0, 50.0, 47.0, 56.0, 31.0, 34.0, 48.0, 38.0, 46.0, 32.0, 45.0, 34.0, 39.0, 39.0, 23.0, 18.0, 11.0, 13.0, 18.0, 12.0, 6.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.888671875, -2.79107666015625, -2.6934814453125, -2.59588623046875, -2.498291015625, -2.40069580078125, -2.3031005859375, -2.20550537109375, -2.10791015625, -2.01031494140625, -1.9127197265625, -1.81512451171875, -1.717529296875, -1.61993408203125, -1.5223388671875, -1.42474365234375, -1.3271484375, -1.22955322265625, -1.1319580078125, -1.03436279296875, -0.936767578125, -0.83917236328125, -0.7415771484375, -0.64398193359375, -0.54638671875, -0.44879150390625, -0.3511962890625, -0.25360107421875, -0.156005859375, -0.05841064453125, 0.0391845703125, 0.13677978515625, 0.234375, 0.33197021484375, 0.4295654296875, 0.52716064453125, 0.624755859375, 0.72235107421875, 0.8199462890625, 0.91754150390625, 1.01513671875, 1.11273193359375, 1.2103271484375, 1.30792236328125, 1.405517578125, 1.50311279296875, 1.6007080078125, 1.69830322265625, 1.7958984375, 1.89349365234375, 1.9910888671875, 2.08868408203125, 2.186279296875, 2.28387451171875, 2.3814697265625, 2.47906494140625, 2.57666015625, 2.67425537109375, 2.7718505859375, 2.86944580078125, 2.967041015625, 3.06463623046875, 3.1622314453125, 3.25982666015625, 3.357421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 8.0, 11.0, 15.0, 19.0, 18.0, 19.0, 35.0, 34.0, 75.0, 102.0, 162.0, 255.0, 418.0, 692.0, 1376.0, 2557.0, 5616.0, 13397.0, 36560.0, 128500.0, 973631.0, 2761622.0, 189555.0, 48937.0, 16962.0, 6888.0, 3136.0, 1682.0, 775.0, 451.0, 258.0, 154.0, 103.0, 76.0, 61.0, 39.0, 29.0, 17.0, 14.0, 6.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.6875, -19.110595703125, -18.53369140625, -17.956787109375, -17.3798828125, -16.802978515625, -16.22607421875, -15.649169921875, -15.072265625, -14.495361328125, -13.91845703125, -13.341552734375, -12.7646484375, -12.187744140625, -11.61083984375, -11.033935546875, -10.45703125, -9.880126953125, -9.30322265625, -8.726318359375, -8.1494140625, -7.572509765625, -6.99560546875, -6.418701171875, -5.841796875, -5.264892578125, -4.68798828125, -4.111083984375, -3.5341796875, -2.957275390625, -2.38037109375, -1.803466796875, -1.2265625, -0.649658203125, -0.07275390625, 0.504150390625, 1.0810546875, 1.657958984375, 2.23486328125, 2.811767578125, 3.388671875, 3.965576171875, 4.54248046875, 5.119384765625, 5.6962890625, 6.273193359375, 6.85009765625, 7.427001953125, 8.00390625, 8.580810546875, 9.15771484375, 9.734619140625, 10.3115234375, 10.888427734375, 11.46533203125, 12.042236328125, 12.619140625, 13.196044921875, 13.77294921875, 14.349853515625, 14.9267578125, 15.503662109375, 16.08056640625, 16.657470703125, 17.234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 15.0, 12.0, 23.0, 34.0, 54.0, 61.0, 108.0, 230.0, 486.0, 1653.0, 634.0, 308.0, 147.0, 85.0, 63.0, 47.0, 28.0, 17.0, 11.0, 7.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.953125, -8.6876220703125, -8.422119140625, -8.1566162109375, -7.89111328125, -7.6256103515625, -7.360107421875, -7.0946044921875, -6.8291015625, -6.5635986328125, -6.298095703125, -6.0325927734375, -5.76708984375, -5.5015869140625, -5.236083984375, -4.9705810546875, -4.705078125, -4.4395751953125, -4.174072265625, -3.9085693359375, -3.64306640625, -3.3775634765625, -3.112060546875, -2.8465576171875, -2.5810546875, -2.3155517578125, -2.050048828125, -1.7845458984375, -1.51904296875, -1.2535400390625, -0.988037109375, -0.7225341796875, -0.45703125, -0.1915283203125, 0.073974609375, 0.3394775390625, 0.60498046875, 0.8704833984375, 1.135986328125, 1.4014892578125, 1.6669921875, 1.9324951171875, 2.197998046875, 2.4635009765625, 2.72900390625, 2.9945068359375, 3.260009765625, 3.5255126953125, 3.791015625, 4.0565185546875, 4.322021484375, 4.5875244140625, 4.85302734375, 5.1185302734375, 5.384033203125, 5.6495361328125, 5.9150390625, 6.1805419921875, 6.446044921875, 6.7115478515625, 6.97705078125, 7.2425537109375, 7.508056640625, 7.7735595703125, 8.0390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 11.0, 7.0, 6.0, 9.0, 20.0, 21.0, 38.0, 54.0, 96.0, 109.0, 127.0, 126.0, 109.0, 94.0, 67.0, 35.0, 39.0, 17.0, 9.0, 10.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.28128051757812, -68.7434310913086, -67.2055892944336, -65.66773986816406, -64.12989044189453, -62.59204864501953, -61.05419921875, -59.516353607177734, -57.97850799560547, -56.4406623840332, -54.90281295776367, -53.364967346191406, -51.82712173461914, -50.289276123046875, -48.751426696777344, -47.21358108520508, -45.67573547363281, -44.13788986206055, -42.600040435791016, -41.06219482421875, -39.524349212646484, -37.98650360107422, -36.44865417480469, -34.91080856323242, -33.37295913696289, -31.835111618041992, -30.297266006469727, -28.759418487548828, -27.221572875976562, -25.683725357055664, -24.145877838134766, -22.6080322265625, -21.070188522338867, -19.53234100341797, -17.994495391845703, -16.456647872924805, -14.918802261352539, -13.38095474243164, -11.843108177185059, -10.305261611938477, -8.767415046691895, -7.2295684814453125, -5.6917219161987305, -4.15387487411499, -2.616028308868408, -1.0781817436218262, 0.45966529846191406, 1.997511863708496, 3.535358428955078, 5.07320499420166, 6.611051559448242, 8.14889907836914, 9.686744689941406, 11.224592208862305, 12.762438774108887, 14.300285339355469, 15.83813190460205, 17.375978469848633, 18.91382598876953, 20.451671600341797, 21.989519119262695, 23.52736473083496, 25.06521224975586, 26.603057861328125, 28.140905380249023]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 11.0, 11.0, 10.0, 9.0, 14.0, 17.0, 16.0, 26.0, 32.0, 29.0, 41.0, 32.0, 36.0, 46.0, 43.0, 37.0, 42.0, 38.0, 52.0, 35.0, 48.0, 40.0, 37.0, 58.0, 36.0, 29.0, 31.0, 24.0, 22.0, 21.0, 10.0, 19.0, 10.0, 4.0, 7.0, 2.0, 11.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.436439514160156, -25.6163387298584, -24.79623794555664, -23.976137161254883, -23.156036376953125, -22.335933685302734, -21.515832901000977, -20.69573211669922, -19.87563133239746, -19.055530548095703, -18.235429763793945, -17.415328979492188, -16.595226287841797, -15.775126457214355, -14.955024719238281, -14.134923934936523, -13.314823150634766, -12.494722366333008, -11.67462158203125, -10.854519844055176, -10.034419059753418, -9.21431827545166, -8.394216537475586, -7.574115753173828, -6.75401496887207, -5.9339141845703125, -5.1138129234313965, -4.2937116622924805, -3.4736108779907227, -2.653510093688965, -1.8334088325500488, -1.0133075714111328, -0.1932086944580078, 0.6268923282623291, 1.446993350982666, 2.267094373703003, 3.08719539642334, 3.9072961807250977, 4.727397441864014, 5.54749870300293, 6.3675994873046875, 7.187700271606445, 8.007801055908203, 8.827902793884277, 9.648003578186035, 10.468104362487793, 11.288206100463867, 12.108306884765625, 12.928407669067383, 13.74850845336914, 14.568609237670898, 15.388710975646973, 16.208812713623047, 17.028911590576172, 17.849014282226562, 18.66911506652832, 19.489215850830078, 20.309316635131836, 21.129417419433594, 21.94951820373535, 22.76961898803711, 23.5897216796875, 24.409822463989258, 25.229923248291016, 26.050024032592773]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 11.0, 12.0, 22.0, 30.0, 48.0, 68.0, 109.0, 217.0, 351.0, 569.0, 1144.0, 2368.0, 5256.0, 12797.0, 34871.0, 94199.0, 246733.0, 375501.0, 170368.0, 63832.0, 23607.0, 8883.0, 3813.0, 1781.0, 866.0, 438.0, 295.0, 152.0, 75.0, 52.0, 33.0, 22.0, 16.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.793212890625, -17.16455078125, -16.535888671875, -15.9072265625, -15.278564453125, -14.64990234375, -14.021240234375, -13.392578125, -12.763916015625, -12.13525390625, -11.506591796875, -10.8779296875, -10.249267578125, -9.62060546875, -8.991943359375, -8.36328125, -7.734619140625, -7.10595703125, -6.477294921875, -5.8486328125, -5.219970703125, -4.59130859375, -3.962646484375, -3.333984375, -2.705322265625, -2.07666015625, -1.447998046875, -0.8193359375, -0.190673828125, 0.43798828125, 1.066650390625, 1.6953125, 2.323974609375, 2.95263671875, 3.581298828125, 4.2099609375, 4.838623046875, 5.46728515625, 6.095947265625, 6.724609375, 7.353271484375, 7.98193359375, 8.610595703125, 9.2392578125, 9.867919921875, 10.49658203125, 11.125244140625, 11.75390625, 12.382568359375, 13.01123046875, 13.639892578125, 14.2685546875, 14.897216796875, 15.52587890625, 16.154541015625, 16.783203125, 17.411865234375, 18.04052734375, 18.669189453125, 19.2978515625, 19.926513671875, 20.55517578125, 21.183837890625, 21.8125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 3.0, 9.0, 10.0, 15.0, 16.0, 16.0, 31.0, 26.0, 24.0, 27.0, 42.0, 56.0, 53.0, 53.0, 55.0, 53.0, 50.0, 43.0, 37.0, 46.0, 44.0, 47.0, 35.0, 34.0, 38.0, 21.0, 16.0, 19.0, 20.0, 11.0, 12.0, 7.0, 6.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.255859375, -3.141693115234375, -3.02752685546875, -2.913360595703125, -2.7991943359375, -2.685028076171875, -2.57086181640625, -2.456695556640625, -2.342529296875, -2.228363037109375, -2.11419677734375, -2.000030517578125, -1.8858642578125, -1.771697998046875, -1.65753173828125, -1.543365478515625, -1.42919921875, -1.315032958984375, -1.20086669921875, -1.086700439453125, -0.9725341796875, -0.858367919921875, -0.74420166015625, -0.630035400390625, -0.515869140625, -0.401702880859375, -0.28753662109375, -0.173370361328125, -0.0592041015625, 0.054962158203125, 0.16912841796875, 0.283294677734375, 0.3974609375, 0.511627197265625, 0.62579345703125, 0.739959716796875, 0.8541259765625, 0.968292236328125, 1.08245849609375, 1.196624755859375, 1.310791015625, 1.424957275390625, 1.53912353515625, 1.653289794921875, 1.7674560546875, 1.881622314453125, 1.99578857421875, 2.109954833984375, 2.22412109375, 2.338287353515625, 2.45245361328125, 2.566619873046875, 2.6807861328125, 2.794952392578125, 2.90911865234375, 3.023284912109375, 3.137451171875, 3.251617431640625, 3.36578369140625, 3.479949951171875, 3.5941162109375, 3.708282470703125, 3.82244873046875, 3.936614990234375, 4.05078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 12.0, 9.0, 13.0, 22.0, 16.0, 32.0, 33.0, 37.0, 63.0, 58.0, 87.0, 78.0, 132.0, 157.0, 223.0, 292.0, 382.0, 513.0, 850.0, 1728.0, 4799.0, 18268.0, 84723.0, 371706.0, 430680.0, 101306.0, 21719.0, 5414.0, 1935.0, 926.0, 583.0, 364.0, 311.0, 234.0, 167.0, 142.0, 118.0, 86.0, 67.0, 46.0, 41.0, 40.0, 30.0, 30.0, 22.0, 15.0, 7.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.25, -20.587158203125, -19.92431640625, -19.261474609375, -18.5986328125, -17.935791015625, -17.27294921875, -16.610107421875, -15.947265625, -15.284423828125, -14.62158203125, -13.958740234375, -13.2958984375, -12.633056640625, -11.97021484375, -11.307373046875, -10.64453125, -9.981689453125, -9.31884765625, -8.656005859375, -7.9931640625, -7.330322265625, -6.66748046875, -6.004638671875, -5.341796875, -4.678955078125, -4.01611328125, -3.353271484375, -2.6904296875, -2.027587890625, -1.36474609375, -0.701904296875, -0.0390625, 0.623779296875, 1.28662109375, 1.949462890625, 2.6123046875, 3.275146484375, 3.93798828125, 4.600830078125, 5.263671875, 5.926513671875, 6.58935546875, 7.252197265625, 7.9150390625, 8.577880859375, 9.24072265625, 9.903564453125, 10.56640625, 11.229248046875, 11.89208984375, 12.554931640625, 13.2177734375, 13.880615234375, 14.54345703125, 15.206298828125, 15.869140625, 16.531982421875, 17.19482421875, 17.857666015625, 18.5205078125, 19.183349609375, 19.84619140625, 20.509033203125, 21.171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 12.0, 10.0, 12.0, 13.0, 17.0, 19.0, 17.0, 19.0, 29.0, 28.0, 41.0, 30.0, 27.0, 38.0, 36.0, 32.0, 51.0, 46.0, 51.0, 42.0, 43.0, 43.0, 43.0, 37.0, 42.0, 31.0, 32.0, 26.0, 16.0, 11.0, 14.0, 14.0, 12.0, 10.0, 11.0, 7.0, 7.0, 4.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.390625, -13.9525146484375, -13.514404296875, -13.0762939453125, -12.63818359375, -12.2000732421875, -11.761962890625, -11.3238525390625, -10.8857421875, -10.4476318359375, -10.009521484375, -9.5714111328125, -9.13330078125, -8.6951904296875, -8.257080078125, -7.8189697265625, -7.380859375, -6.9427490234375, -6.504638671875, -6.0665283203125, -5.62841796875, -5.1903076171875, -4.752197265625, -4.3140869140625, -3.8759765625, -3.4378662109375, -2.999755859375, -2.5616455078125, -2.12353515625, -1.6854248046875, -1.247314453125, -0.8092041015625, -0.37109375, 0.0670166015625, 0.505126953125, 0.9432373046875, 1.38134765625, 1.8194580078125, 2.257568359375, 2.6956787109375, 3.1337890625, 3.5718994140625, 4.010009765625, 4.4481201171875, 4.88623046875, 5.3243408203125, 5.762451171875, 6.2005615234375, 6.638671875, 7.0767822265625, 7.514892578125, 7.9530029296875, 8.39111328125, 8.8292236328125, 9.267333984375, 9.7054443359375, 10.1435546875, 10.5816650390625, 11.019775390625, 11.4578857421875, 11.89599609375, 12.3341064453125, 12.772216796875, 13.2103271484375, 13.6484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 19.0, 21.0, 33.0, 65.0, 116.0, 303.0, 723.0, 2587.0, 13211.0, 136857.0, 778676.0, 101832.0, 10671.0, 2196.0, 701.0, 264.0, 120.0, 58.0, 27.0, 21.0, 15.0, 12.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.515625, -21.88037109375, -21.2451171875, -20.60986328125, -19.974609375, -19.33935546875, -18.7041015625, -18.06884765625, -17.43359375, -16.79833984375, -16.1630859375, -15.52783203125, -14.892578125, -14.25732421875, -13.6220703125, -12.98681640625, -12.3515625, -11.71630859375, -11.0810546875, -10.44580078125, -9.810546875, -9.17529296875, -8.5400390625, -7.90478515625, -7.26953125, -6.63427734375, -5.9990234375, -5.36376953125, -4.728515625, -4.09326171875, -3.4580078125, -2.82275390625, -2.1875, -1.55224609375, -0.9169921875, -0.28173828125, 0.353515625, 0.98876953125, 1.6240234375, 2.25927734375, 2.89453125, 3.52978515625, 4.1650390625, 4.80029296875, 5.435546875, 6.07080078125, 6.7060546875, 7.34130859375, 7.9765625, 8.61181640625, 9.2470703125, 9.88232421875, 10.517578125, 11.15283203125, 11.7880859375, 12.42333984375, 13.05859375, 13.69384765625, 14.3291015625, 14.96435546875, 15.599609375, 16.23486328125, 16.8701171875, 17.50537109375, 18.140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 7.0, 16.0, 24.0, 23.0, 40.0, 45.0, 70.0, 106.0, 169.0, 193.0, 87.0, 53.0, 43.0, 31.0, 27.0, 12.0, 14.0, 11.0, 6.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.003566741943359375, -0.003490731120109558, -0.003414720296859741, -0.0033387094736099243, -0.0032626986503601074, -0.0031866878271102905, -0.0031106770038604736, -0.0030346661806106567, -0.00295865535736084, -0.002882644534111023, -0.002806633710861206, -0.002730622887611389, -0.0026546120643615723, -0.0025786012411117554, -0.0025025904178619385, -0.0024265795946121216, -0.0023505687713623047, -0.002274557948112488, -0.002198547124862671, -0.002122536301612854, -0.002046525478363037, -0.00197051465511322, -0.0018945038318634033, -0.0018184930086135864, -0.0017424821853637695, -0.0016664713621139526, -0.0015904605388641357, -0.0015144497156143188, -0.001438438892364502, -0.001362428069114685, -0.0012864172458648682, -0.0012104064226150513, -0.0011343955993652344, -0.0010583847761154175, -0.0009823739528656006, -0.0009063631296157837, -0.0008303523063659668, -0.0007543414831161499, -0.000678330659866333, -0.0006023198366165161, -0.0005263090133666992, -0.0004502981901168823, -0.00037428736686706543, -0.00029827654361724854, -0.00022226572036743164, -0.00014625489711761475, -7.024407386779785e-05, 5.766749382019043e-06, 8.177757263183594e-05, 0.00015778839588165283, 0.00023379921913146973, 0.0003098100423812866, 0.0003858208656311035, 0.0004618316888809204, 0.0005378425121307373, 0.0006138533353805542, 0.0006898641586303711, 0.000765874981880188, 0.0008418858051300049, 0.0009178966283798218, 0.0009939074516296387, 0.0010699182748794556, 0.0011459290981292725, 0.0012219399213790894, 0.0012979507446289062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 8.0, 10.0, 17.0, 50.0, 71.0, 110.0, 174.0, 388.0, 1011.0, 4323.0, 65754.0, 903294.0, 67108.0, 4298.0, 973.0, 412.0, 208.0, 135.0, 83.0, 43.0, 31.0, 16.0, 11.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.40625, -34.436279296875, -33.46630859375, -32.496337890625, -31.5263671875, -30.556396484375, -29.58642578125, -28.616455078125, -27.646484375, -26.676513671875, -25.70654296875, -24.736572265625, -23.7666015625, -22.796630859375, -21.82666015625, -20.856689453125, -19.88671875, -18.916748046875, -17.94677734375, -16.976806640625, -16.0068359375, -15.036865234375, -14.06689453125, -13.096923828125, -12.126953125, -11.156982421875, -10.18701171875, -9.217041015625, -8.2470703125, -7.277099609375, -6.30712890625, -5.337158203125, -4.3671875, -3.397216796875, -2.42724609375, -1.457275390625, -0.4873046875, 0.482666015625, 1.45263671875, 2.422607421875, 3.392578125, 4.362548828125, 5.33251953125, 6.302490234375, 7.2724609375, 8.242431640625, 9.21240234375, 10.182373046875, 11.15234375, 12.122314453125, 13.09228515625, 14.062255859375, 15.0322265625, 16.002197265625, 16.97216796875, 17.942138671875, 18.912109375, 19.882080078125, 20.85205078125, 21.822021484375, 22.7919921875, 23.761962890625, 24.73193359375, 25.701904296875, 26.671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 11.0, 11.0, 27.0, 32.0, 37.0, 52.0, 75.0, 104.0, 99.0, 150.0, 105.0, 74.0, 50.0, 43.0, 25.0, 26.0, 20.0, 16.0, 14.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.8515625, -13.4691162109375, -13.086669921875, -12.7042236328125, -12.32177734375, -11.9393310546875, -11.556884765625, -11.1744384765625, -10.7919921875, -10.4095458984375, -10.027099609375, -9.6446533203125, -9.26220703125, -8.8797607421875, -8.497314453125, -8.1148681640625, -7.732421875, -7.3499755859375, -6.967529296875, -6.5850830078125, -6.20263671875, -5.8201904296875, -5.437744140625, -5.0552978515625, -4.6728515625, -4.2904052734375, -3.907958984375, -3.5255126953125, -3.14306640625, -2.7606201171875, -2.378173828125, -1.9957275390625, -1.61328125, -1.2308349609375, -0.848388671875, -0.4659423828125, -0.08349609375, 0.2989501953125, 0.681396484375, 1.0638427734375, 1.4462890625, 1.8287353515625, 2.211181640625, 2.5936279296875, 2.97607421875, 3.3585205078125, 3.740966796875, 4.1234130859375, 4.505859375, 4.8883056640625, 5.270751953125, 5.6531982421875, 6.03564453125, 6.4180908203125, 6.800537109375, 7.1829833984375, 7.5654296875, 7.9478759765625, 8.330322265625, 8.7127685546875, 9.09521484375, 9.4776611328125, 9.860107421875, 10.2425537109375, 10.625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 14.0, 29.0, 98.0, 229.0, 328.0, 194.0, 85.0, 24.0, 9.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-400.1737365722656, -389.239990234375, -378.3062744140625, -367.3725280761719, -356.4388122558594, -345.50506591796875, -334.57135009765625, -323.6376037597656, -312.703857421875, -301.7701110839844, -290.8363952636719, -279.90264892578125, -268.96893310546875, -258.0351867675781, -247.10145568847656, -236.167724609375, -225.2340087890625, -214.30027770996094, -203.36654663085938, -192.43280029296875, -181.49908447265625, -170.56533813476562, -159.63160705566406, -148.6978759765625, -137.76414489746094, -126.83041381835938, -115.89668273925781, -104.96294403076172, -94.02921295166016, -83.0954818725586, -72.1617431640625, -61.22801208496094, -50.2943115234375, -39.36058044433594, -28.42684555053711, -17.49311065673828, -6.559379577636719, 4.374351501464844, 15.308090209960938, 26.2418212890625, 37.17555236816406, 48.109283447265625, 59.04301834106445, 69.97675323486328, 80.91048431396484, 91.8442153930664, 102.7779541015625, 113.71168518066406, 124.64541625976562, 135.5791473388672, 146.51287841796875, 157.44662475585938, 168.38034057617188, 179.3140869140625, 190.24781799316406, 201.18154907226562, 212.1152801513672, 223.04901123046875, 233.9827423095703, 244.91647338867188, 255.8502197265625, 266.783935546875, 277.7176818847656, 288.65142822265625, 299.58514404296875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 3.0, 8.0, 9.0, 13.0, 13.0, 12.0, 21.0, 20.0, 23.0, 21.0, 33.0, 36.0, 34.0, 34.0, 44.0, 34.0, 30.0, 30.0, 31.0, 51.0, 44.0, 42.0, 38.0, 52.0, 31.0, 39.0, 28.0, 31.0, 29.0, 28.0, 13.0, 26.0, 15.0, 16.0, 17.0, 15.0, 7.0, 3.0, 6.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-79.36653137207031, -77.12184143066406, -74.87715148925781, -72.63246154785156, -70.38777160644531, -68.14308166503906, -65.89839172363281, -63.65370178222656, -61.40901184082031, -59.16432189941406, -56.91963195800781, -54.67494201660156, -52.43025207519531, -50.18556213378906, -47.94087219238281, -45.69618225097656, -43.45149230957031, -41.20680236816406, -38.96211242675781, -36.71742248535156, -34.47273254394531, -32.22804260253906, -29.983352661132812, -27.738662719726562, -25.493972778320312, -23.249282836914062, -21.004592895507812, -18.759902954101562, -16.515213012695312, -14.270523071289062, -12.025833129882812, -9.781143188476562, -7.536445617675781, -5.291755676269531, -3.0470657348632812, -0.8023757934570312, 1.4423141479492188, 3.6870040893554688, 5.931694030761719, 8.176383972167969, 10.421073913574219, 12.665763854980469, 14.910453796386719, 17.15514373779297, 19.39983367919922, 21.64452362060547, 23.88921356201172, 26.13390350341797, 28.37859344482422, 30.62328338623047, 32.86797332763672, 35.11266326904297, 37.35735321044922, 39.60204315185547, 41.84673309326172, 44.09142303466797, 46.33611297607422, 48.58080291748047, 50.82549285888672, 53.07018280029297, 55.31487274169922, 57.55956268310547, 59.80425262451172, 62.04894256591797, 64.29363250732422]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 10.0, 6.0, 6.0, 16.0, 21.0, 42.0, 36.0, 61.0, 86.0, 130.0, 213.0, 301.0, 422.0, 698.0, 1246.0, 2079.0, 3990.0, 8053.0, 18524.0, 49165.0, 167850.0, 1205398.0, 2424258.0, 211326.0, 58315.0, 21611.0, 9487.0, 4728.0, 2434.0, 1406.0, 822.0, 524.0, 334.0, 190.0, 163.0, 107.0, 51.0, 63.0, 35.0, 23.0, 16.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-20.328125, -19.7799072265625, -19.231689453125, -18.6834716796875, -18.13525390625, -17.5870361328125, -17.038818359375, -16.4906005859375, -15.9423828125, -15.3941650390625, -14.845947265625, -14.2977294921875, -13.74951171875, -13.2012939453125, -12.653076171875, -12.1048583984375, -11.556640625, -11.0084228515625, -10.460205078125, -9.9119873046875, -9.36376953125, -8.8155517578125, -8.267333984375, -7.7191162109375, -7.1708984375, -6.6226806640625, -6.074462890625, -5.5262451171875, -4.97802734375, -4.4298095703125, -3.881591796875, -3.3333740234375, -2.78515625, -2.2369384765625, -1.688720703125, -1.1405029296875, -0.59228515625, -0.0440673828125, 0.504150390625, 1.0523681640625, 1.6005859375, 2.1488037109375, 2.697021484375, 3.2452392578125, 3.79345703125, 4.3416748046875, 4.889892578125, 5.4381103515625, 5.986328125, 6.5345458984375, 7.082763671875, 7.6309814453125, 8.17919921875, 8.7274169921875, 9.275634765625, 9.8238525390625, 10.3720703125, 10.9202880859375, 11.468505859375, 12.0167236328125, 12.56494140625, 13.1131591796875, 13.661376953125, 14.2095947265625, 14.7578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 11.0, 4.0, 11.0, 21.0, 24.0, 21.0, 17.0, 28.0, 33.0, 37.0, 52.0, 47.0, 36.0, 67.0, 49.0, 64.0, 52.0, 43.0, 42.0, 39.0, 36.0, 36.0, 36.0, 36.0, 34.0, 28.0, 19.0, 15.0, 10.0, 14.0, 8.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.615234375, -3.493499755859375, -3.37176513671875, -3.250030517578125, -3.1282958984375, -3.006561279296875, -2.88482666015625, -2.763092041015625, -2.641357421875, -2.519622802734375, -2.39788818359375, -2.276153564453125, -2.1544189453125, -2.032684326171875, -1.91094970703125, -1.789215087890625, -1.66748046875, -1.545745849609375, -1.42401123046875, -1.302276611328125, -1.1805419921875, -1.058807373046875, -0.93707275390625, -0.815338134765625, -0.693603515625, -0.571868896484375, -0.45013427734375, -0.328399658203125, -0.2066650390625, -0.084930419921875, 0.03680419921875, 0.158538818359375, 0.2802734375, 0.402008056640625, 0.52374267578125, 0.645477294921875, 0.7672119140625, 0.888946533203125, 1.01068115234375, 1.132415771484375, 1.254150390625, 1.375885009765625, 1.49761962890625, 1.619354248046875, 1.7410888671875, 1.862823486328125, 1.98455810546875, 2.106292724609375, 2.22802734375, 2.349761962890625, 2.47149658203125, 2.593231201171875, 2.7149658203125, 2.836700439453125, 2.95843505859375, 3.080169677734375, 3.201904296875, 3.323638916015625, 3.44537353515625, 3.567108154296875, 3.6888427734375, 3.810577392578125, 3.93231201171875, 4.054046630859375, 4.17578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 8.0, 4.0, 10.0, 11.0, 17.0, 24.0, 26.0, 61.0, 65.0, 121.0, 190.0, 320.0, 510.0, 818.0, 1573.0, 2546.0, 5094.0, 10242.0, 23275.0, 60678.0, 193231.0, 967851.0, 2432273.0, 339201.0, 93972.0, 33561.0, 14069.0, 6648.0, 3447.0, 1820.0, 991.0, 634.0, 370.0, 203.0, 151.0, 106.0, 59.0, 46.0, 21.0, 18.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.345703125, -12.91796875, -12.490234375, -12.0625, -11.634765625, -11.20703125, -10.779296875, -10.3515625, -9.923828125, -9.49609375, -9.068359375, -8.640625, -8.212890625, -7.78515625, -7.357421875, -6.9296875, -6.501953125, -6.07421875, -5.646484375, -5.21875, -4.791015625, -4.36328125, -3.935546875, -3.5078125, -3.080078125, -2.65234375, -2.224609375, -1.796875, -1.369140625, -0.94140625, -0.513671875, -0.0859375, 0.341796875, 0.76953125, 1.197265625, 1.625, 2.052734375, 2.48046875, 2.908203125, 3.3359375, 3.763671875, 4.19140625, 4.619140625, 5.046875, 5.474609375, 5.90234375, 6.330078125, 6.7578125, 7.185546875, 7.61328125, 8.041015625, 8.46875, 8.896484375, 9.32421875, 9.751953125, 10.1796875, 10.607421875, 11.03515625, 11.462890625, 11.890625, 12.318359375, 12.74609375, 13.173828125, 13.6015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 5.0, 5.0, 5.0, 6.0, 12.0, 11.0, 13.0, 16.0, 40.0, 39.0, 64.0, 91.0, 149.0, 203.0, 328.0, 668.0, 1076.0, 464.0, 303.0, 162.0, 118.0, 69.0, 57.0, 47.0, 20.0, 25.0, 16.0, 15.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.75225830078125, -8.4888916015625, -8.22552490234375, -7.962158203125, -7.69879150390625, -7.4354248046875, -7.17205810546875, -6.90869140625, -6.64532470703125, -6.3819580078125, -6.11859130859375, -5.855224609375, -5.59185791015625, -5.3284912109375, -5.06512451171875, -4.8017578125, -4.53839111328125, -4.2750244140625, -4.01165771484375, -3.748291015625, -3.48492431640625, -3.2215576171875, -2.95819091796875, -2.69482421875, -2.43145751953125, -2.1680908203125, -1.90472412109375, -1.641357421875, -1.37799072265625, -1.1146240234375, -0.85125732421875, -0.587890625, -0.32452392578125, -0.0611572265625, 0.20220947265625, 0.465576171875, 0.72894287109375, 0.9923095703125, 1.25567626953125, 1.51904296875, 1.78240966796875, 2.0457763671875, 2.30914306640625, 2.572509765625, 2.83587646484375, 3.0992431640625, 3.36260986328125, 3.6259765625, 3.88934326171875, 4.1527099609375, 4.41607666015625, 4.679443359375, 4.94281005859375, 5.2061767578125, 5.46954345703125, 5.73291015625, 5.99627685546875, 6.2596435546875, 6.52301025390625, 6.786376953125, 7.04974365234375, 7.3131103515625, 7.57647705078125, 7.83984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 27.0, 39.0, 116.0, 219.0, 246.0, 190.0, 90.0, 49.0, 15.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.73622131347656, -135.66502380371094, -131.5938262939453, -127.52262878417969, -123.45142364501953, -119.3802261352539, -115.30902862548828, -111.23783111572266, -107.1666259765625, -103.09542846679688, -99.02423095703125, -94.95303344726562, -90.88182830810547, -86.81063079833984, -82.73943328857422, -78.6682357788086, -74.59703826904297, -70.52584075927734, -66.45464324951172, -62.38344192504883, -58.31224060058594, -54.24104309082031, -50.16984558105469, -46.09864807128906, -42.02744674682617, -37.95624923706055, -33.885047912597656, -29.81385040283203, -25.742650985717773, -21.671451568603516, -17.60025405883789, -13.529054641723633, -9.457855224609375, -5.386656284332275, -1.3154573440551758, 2.7557411193847656, 6.826940536499023, 10.898139953613281, 14.969337463378906, 19.040536880493164, 23.111736297607422, 27.18293571472168, 31.254135131835938, 35.32533264160156, 39.39653015136719, 43.46773147583008, 47.5389289855957, 51.610130310058594, 55.68132781982422, 59.752525329589844, 63.823726654052734, 67.89492797851562, 71.96612548828125, 76.03732299804688, 80.1085205078125, 84.17971801757812, 88.25091552734375, 92.32211303710938, 96.393310546875, 100.46450805664062, 104.53571319580078, 108.6069107055664, 112.67810821533203, 116.74930572509766, 120.82051086425781]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 7.0, 8.0, 12.0, 19.0, 15.0, 19.0, 21.0, 24.0, 33.0, 40.0, 35.0, 40.0, 51.0, 46.0, 55.0, 58.0, 33.0, 32.0, 44.0, 51.0, 31.0, 40.0, 45.0, 42.0, 28.0, 26.0, 17.0, 20.0, 19.0, 17.0, 18.0, 12.0, 10.0, 5.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.3070068359375, -29.253692626953125, -28.200380325317383, -27.14706802368164, -26.093753814697266, -25.04043960571289, -23.98712730407715, -22.933815002441406, -21.88050079345703, -20.827186584472656, -19.773874282836914, -18.720561981201172, -17.667247772216797, -16.613933563232422, -15.56062126159668, -14.507308006286621, -13.453994750976562, -12.400681495666504, -11.347368240356445, -10.294054985046387, -9.240741729736328, -8.18742847442627, -7.134115219116211, -6.080801963806152, -5.027488708496094, -3.974175453186035, -2.9208621978759766, -1.867548942565918, -0.8142356872558594, 0.23907756805419922, 1.2923908233642578, 2.3457040786743164, 3.3990211486816406, 4.452334403991699, 5.505647659301758, 6.558960914611816, 7.612274169921875, 8.665587425231934, 9.718900680541992, 10.77221393585205, 11.82552719116211, 12.878840446472168, 13.932153701782227, 14.985466957092285, 16.038780212402344, 17.09209442138672, 18.14540672302246, 19.198719024658203, 20.252033233642578, 21.305347442626953, 22.358659744262695, 23.411972045898438, 24.465286254882812, 25.518600463867188, 26.57191276550293, 27.625225067138672, 28.678539276123047, 29.731853485107422, 30.785165786743164, 31.838478088378906, 32.89179229736328, 33.945106506347656, 34.99842071533203, 36.05173110961914, 37.105045318603516]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 8.0, 17.0, 22.0, 26.0, 39.0, 70.0, 105.0, 163.0, 297.0, 467.0, 884.0, 1658.0, 3677.0, 8158.0, 19506.0, 49647.0, 131970.0, 297608.0, 305903.0, 138566.0, 52563.0, 20719.0, 8687.0, 3852.0, 1759.0, 900.0, 475.0, 305.0, 167.0, 109.0, 87.0, 48.0, 35.0, 25.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.953125, -17.392578125, -16.83203125, -16.271484375, -15.7109375, -15.150390625, -14.58984375, -14.029296875, -13.46875, -12.908203125, -12.34765625, -11.787109375, -11.2265625, -10.666015625, -10.10546875, -9.544921875, -8.984375, -8.423828125, -7.86328125, -7.302734375, -6.7421875, -6.181640625, -5.62109375, -5.060546875, -4.5, -3.939453125, -3.37890625, -2.818359375, -2.2578125, -1.697265625, -1.13671875, -0.576171875, -0.015625, 0.544921875, 1.10546875, 1.666015625, 2.2265625, 2.787109375, 3.34765625, 3.908203125, 4.46875, 5.029296875, 5.58984375, 6.150390625, 6.7109375, 7.271484375, 7.83203125, 8.392578125, 8.953125, 9.513671875, 10.07421875, 10.634765625, 11.1953125, 11.755859375, 12.31640625, 12.876953125, 13.4375, 13.998046875, 14.55859375, 15.119140625, 15.6796875, 16.240234375, 16.80078125, 17.361328125, 17.921875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 9.0, 15.0, 10.0, 18.0, 20.0, 16.0, 28.0, 35.0, 40.0, 56.0, 34.0, 52.0, 54.0, 49.0, 53.0, 50.0, 40.0, 47.0, 44.0, 43.0, 40.0, 41.0, 39.0, 22.0, 22.0, 16.0, 24.0, 16.0, 16.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.623046875, -3.495330810546875, -3.36761474609375, -3.239898681640625, -3.1121826171875, -2.984466552734375, -2.85675048828125, -2.729034423828125, -2.601318359375, -2.473602294921875, -2.34588623046875, -2.218170166015625, -2.0904541015625, -1.962738037109375, -1.83502197265625, -1.707305908203125, -1.57958984375, -1.451873779296875, -1.32415771484375, -1.196441650390625, -1.0687255859375, -0.941009521484375, -0.81329345703125, -0.685577392578125, -0.557861328125, -0.430145263671875, -0.30242919921875, -0.174713134765625, -0.0469970703125, 0.080718994140625, 0.20843505859375, 0.336151123046875, 0.4638671875, 0.591583251953125, 0.71929931640625, 0.847015380859375, 0.9747314453125, 1.102447509765625, 1.23016357421875, 1.357879638671875, 1.485595703125, 1.613311767578125, 1.74102783203125, 1.868743896484375, 1.9964599609375, 2.124176025390625, 2.25189208984375, 2.379608154296875, 2.50732421875, 2.635040283203125, 2.76275634765625, 2.890472412109375, 3.0181884765625, 3.145904541015625, 3.27362060546875, 3.401336669921875, 3.529052734375, 3.656768798828125, 3.78448486328125, 3.912200927734375, 4.0399169921875, 4.167633056640625, 4.29534912109375, 4.423065185546875, 4.55078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 6.0, 10.0, 8.0, 12.0, 25.0, 22.0, 31.0, 39.0, 60.0, 91.0, 98.0, 126.0, 158.0, 224.0, 321.0, 448.0, 586.0, 1042.0, 2130.0, 7351.0, 45317.0, 347697.0, 540621.0, 83548.0, 11938.0, 2919.0, 1215.0, 702.0, 472.0, 314.0, 241.0, 186.0, 143.0, 100.0, 77.0, 70.0, 40.0, 32.0, 33.0, 23.0, 18.0, 8.0, 11.0, 11.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-27.0, -26.07373046875, -25.1474609375, -24.22119140625, -23.294921875, -22.36865234375, -21.4423828125, -20.51611328125, -19.58984375, -18.66357421875, -17.7373046875, -16.81103515625, -15.884765625, -14.95849609375, -14.0322265625, -13.10595703125, -12.1796875, -11.25341796875, -10.3271484375, -9.40087890625, -8.474609375, -7.54833984375, -6.6220703125, -5.69580078125, -4.76953125, -3.84326171875, -2.9169921875, -1.99072265625, -1.064453125, -0.13818359375, 0.7880859375, 1.71435546875, 2.640625, 3.56689453125, 4.4931640625, 5.41943359375, 6.345703125, 7.27197265625, 8.1982421875, 9.12451171875, 10.05078125, 10.97705078125, 11.9033203125, 12.82958984375, 13.755859375, 14.68212890625, 15.6083984375, 16.53466796875, 17.4609375, 18.38720703125, 19.3134765625, 20.23974609375, 21.166015625, 22.09228515625, 23.0185546875, 23.94482421875, 24.87109375, 25.79736328125, 26.7236328125, 27.64990234375, 28.576171875, 29.50244140625, 30.4287109375, 31.35498046875, 32.28125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 23.0, 9.0, 22.0, 27.0, 27.0, 35.0, 46.0, 38.0, 42.0, 50.0, 66.0, 58.0, 53.0, 56.0, 47.0, 67.0, 64.0, 45.0, 36.0, 31.0, 33.0, 28.0, 24.0, 17.0, 9.0, 12.0, 10.0, 3.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.75, -25.01025390625, -24.2705078125, -23.53076171875, -22.791015625, -22.05126953125, -21.3115234375, -20.57177734375, -19.83203125, -19.09228515625, -18.3525390625, -17.61279296875, -16.873046875, -16.13330078125, -15.3935546875, -14.65380859375, -13.9140625, -13.17431640625, -12.4345703125, -11.69482421875, -10.955078125, -10.21533203125, -9.4755859375, -8.73583984375, -7.99609375, -7.25634765625, -6.5166015625, -5.77685546875, -5.037109375, -4.29736328125, -3.5576171875, -2.81787109375, -2.078125, -1.33837890625, -0.5986328125, 0.14111328125, 0.880859375, 1.62060546875, 2.3603515625, 3.10009765625, 3.83984375, 4.57958984375, 5.3193359375, 6.05908203125, 6.798828125, 7.53857421875, 8.2783203125, 9.01806640625, 9.7578125, 10.49755859375, 11.2373046875, 11.97705078125, 12.716796875, 13.45654296875, 14.1962890625, 14.93603515625, 15.67578125, 16.41552734375, 17.1552734375, 17.89501953125, 18.634765625, 19.37451171875, 20.1142578125, 20.85400390625, 21.59375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 12.0, 14.0, 26.0, 46.0, 59.0, 90.0, 128.0, 261.0, 439.0, 850.0, 1679.0, 3776.0, 10965.0, 38648.0, 163986.0, 467383.0, 267621.0, 65540.0, 16848.0, 5444.0, 2209.0, 1117.0, 558.0, 321.0, 190.0, 121.0, 74.0, 43.0, 27.0, 25.0, 7.0, 12.0, 13.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.140625, -9.8564453125, -9.572265625, -9.2880859375, -9.00390625, -8.7197265625, -8.435546875, -8.1513671875, -7.8671875, -7.5830078125, -7.298828125, -7.0146484375, -6.73046875, -6.4462890625, -6.162109375, -5.8779296875, -5.59375, -5.3095703125, -5.025390625, -4.7412109375, -4.45703125, -4.1728515625, -3.888671875, -3.6044921875, -3.3203125, -3.0361328125, -2.751953125, -2.4677734375, -2.18359375, -1.8994140625, -1.615234375, -1.3310546875, -1.046875, -0.7626953125, -0.478515625, -0.1943359375, 0.08984375, 0.3740234375, 0.658203125, 0.9423828125, 1.2265625, 1.5107421875, 1.794921875, 2.0791015625, 2.36328125, 2.6474609375, 2.931640625, 3.2158203125, 3.5, 3.7841796875, 4.068359375, 4.3525390625, 4.63671875, 4.9208984375, 5.205078125, 5.4892578125, 5.7734375, 6.0576171875, 6.341796875, 6.6259765625, 6.91015625, 7.1943359375, 7.478515625, 7.7626953125, 8.046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 6.0, 13.0, 19.0, 26.0, 29.0, 40.0, 71.0, 66.0, 91.0, 104.0, 108.0, 93.0, 83.0, 56.0, 59.0, 31.0, 31.0, 25.0, 14.0, 10.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002105712890625, -0.002047628164291382, -0.0019895434379577637, -0.0019314587116241455, -0.0018733739852905273, -0.0018152892589569092, -0.001757204532623291, -0.0016991198062896729, -0.0016410350799560547, -0.0015829503536224365, -0.0015248656272888184, -0.0014667809009552002, -0.001408696174621582, -0.0013506114482879639, -0.0012925267219543457, -0.0012344419956207275, -0.0011763572692871094, -0.0011182725429534912, -0.001060187816619873, -0.0010021030902862549, -0.0009440183639526367, -0.0008859336376190186, -0.0008278489112854004, -0.0007697641849517822, -0.0007116794586181641, -0.0006535947322845459, -0.0005955100059509277, -0.0005374252796173096, -0.0004793405532836914, -0.00042125582695007324, -0.0003631711006164551, -0.0003050863742828369, -0.00024700164794921875, -0.00018891692161560059, -0.00013083219528198242, -7.274746894836426e-05, -1.4662742614746094e-05, 4.342198371887207e-05, 0.00010150671005249023, 0.0001595914363861084, 0.00021767616271972656, 0.0002757608890533447, 0.0003338456153869629, 0.00039193034172058105, 0.0004500150680541992, 0.0005080997943878174, 0.0005661845207214355, 0.0006242692470550537, 0.0006823539733886719, 0.00074043869972229, 0.0007985234260559082, 0.0008566081523895264, 0.0009146928787231445, 0.0009727776050567627, 0.0010308623313903809, 0.001088947057723999, 0.0011470317840576172, 0.0012051165103912354, 0.0012632012367248535, 0.0013212859630584717, 0.0013793706893920898, 0.001437455415725708, 0.0014955401420593262, 0.0015536248683929443, 0.0016117095947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 5.0, 8.0, 5.0, 8.0, 13.0, 24.0, 27.0, 34.0, 52.0, 78.0, 110.0, 223.0, 378.0, 854.0, 2113.0, 9537.0, 125627.0, 767934.0, 127877.0, 9627.0, 2170.0, 796.0, 446.0, 234.0, 149.0, 69.0, 59.0, 25.0, 16.0, 15.0, 18.0, 9.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.359375, -16.790283203125, -16.22119140625, -15.652099609375, -15.0830078125, -14.513916015625, -13.94482421875, -13.375732421875, -12.806640625, -12.237548828125, -11.66845703125, -11.099365234375, -10.5302734375, -9.961181640625, -9.39208984375, -8.822998046875, -8.25390625, -7.684814453125, -7.11572265625, -6.546630859375, -5.9775390625, -5.408447265625, -4.83935546875, -4.270263671875, -3.701171875, -3.132080078125, -2.56298828125, -1.993896484375, -1.4248046875, -0.855712890625, -0.28662109375, 0.282470703125, 0.8515625, 1.420654296875, 1.98974609375, 2.558837890625, 3.1279296875, 3.697021484375, 4.26611328125, 4.835205078125, 5.404296875, 5.973388671875, 6.54248046875, 7.111572265625, 7.6806640625, 8.249755859375, 8.81884765625, 9.387939453125, 9.95703125, 10.526123046875, 11.09521484375, 11.664306640625, 12.2333984375, 12.802490234375, 13.37158203125, 13.940673828125, 14.509765625, 15.078857421875, 15.64794921875, 16.217041015625, 16.7861328125, 17.355224609375, 17.92431640625, 18.493408203125, 19.0625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 11.0, 11.0, 11.0, 15.0, 29.0, 35.0, 54.0, 62.0, 91.0, 74.0, 117.0, 84.0, 82.0, 68.0, 49.0, 46.0, 33.0, 18.0, 26.0, 13.0, 9.0, 7.0, 7.0, 9.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4296875, -9.126220703125, -8.82275390625, -8.519287109375, -8.2158203125, -7.912353515625, -7.60888671875, -7.305419921875, -7.001953125, -6.698486328125, -6.39501953125, -6.091552734375, -5.7880859375, -5.484619140625, -5.18115234375, -4.877685546875, -4.57421875, -4.270751953125, -3.96728515625, -3.663818359375, -3.3603515625, -3.056884765625, -2.75341796875, -2.449951171875, -2.146484375, -1.843017578125, -1.53955078125, -1.236083984375, -0.9326171875, -0.629150390625, -0.32568359375, -0.022216796875, 0.28125, 0.584716796875, 0.88818359375, 1.191650390625, 1.4951171875, 1.798583984375, 2.10205078125, 2.405517578125, 2.708984375, 3.012451171875, 3.31591796875, 3.619384765625, 3.9228515625, 4.226318359375, 4.52978515625, 4.833251953125, 5.13671875, 5.440185546875, 5.74365234375, 6.047119140625, 6.3505859375, 6.654052734375, 6.95751953125, 7.260986328125, 7.564453125, 7.867919921875, 8.17138671875, 8.474853515625, 8.7783203125, 9.081787109375, 9.38525390625, 9.688720703125, 9.9921875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 10.0, 32.0, 42.0, 82.0, 103.0, 142.0, 161.0, 163.0, 116.0, 77.0, 34.0, 22.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-240.88356018066406, -234.98587036132812, -229.08819580078125, -223.1905059814453, -217.29281616210938, -211.3951416015625, -205.49745178222656, -199.59976196289062, -193.70208740234375, -187.8043975830078, -181.90672302246094, -176.009033203125, -170.11134338378906, -164.21365356445312, -158.31597900390625, -152.4182891845703, -146.52059936523438, -140.62290954589844, -134.72523498535156, -128.82754516601562, -122.92985534667969, -117.03217315673828, -111.13449096679688, -105.23680114746094, -99.33911895751953, -93.44143676757812, -87.54374694824219, -81.64606475830078, -75.74838256835938, -69.85069274902344, -63.95301055908203, -58.05532455444336, -52.15763854980469, -46.259952545166016, -40.362266540527344, -34.46458435058594, -28.566898345947266, -22.669212341308594, -16.771530151367188, -10.873844146728516, -4.976158142089844, 0.9215269088745117, 6.819211959838867, 12.716896057128906, 18.614582061767578, 24.51226806640625, 30.409950256347656, 36.30763626098633, 42.205322265625, 48.10300827026367, 54.000694274902344, 59.89837646484375, 65.79606628417969, 71.6937484741211, 77.5914306640625, 83.48912048339844, 89.38680267333984, 95.28448486328125, 101.18217468261719, 107.0798568725586, 112.9775390625, 118.87522888183594, 124.77291107177734, 130.67059326171875, 136.5682830810547]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 6.0, 16.0, 8.0, 19.0, 20.0, 21.0, 33.0, 41.0, 39.0, 28.0, 34.0, 34.0, 43.0, 38.0, 48.0, 37.0, 40.0, 42.0, 49.0, 40.0, 38.0, 33.0, 37.0, 26.0, 25.0, 22.0, 26.0, 24.0, 22.0, 20.0, 16.0, 16.0, 11.0, 2.0, 6.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.13624572753906, -86.36341094970703, -83.59058380126953, -80.8177490234375, -78.04491424560547, -75.27207946777344, -72.49925231933594, -69.7264175415039, -66.95358276367188, -64.18074798583984, -61.40791702270508, -58.63508605957031, -55.86225128173828, -53.089420318603516, -50.31658935546875, -47.54375457763672, -44.77092361450195, -41.99809265136719, -39.225257873535156, -36.45242691040039, -33.67959213256836, -30.906761169433594, -28.133928298950195, -25.361095428466797, -22.5882625579834, -19.8154296875, -17.0425968170166, -14.26976490020752, -11.496932029724121, -8.724099159240723, -5.951267242431641, -3.178434371948242, -0.40560150146484375, 2.3672311305999756, 5.140063762664795, 7.912896156311035, 10.685729026794434, 13.458561897277832, 16.231393814086914, 19.004226684570312, 21.77705955505371, 24.54989242553711, 27.322725296020508, 30.095558166503906, 32.86838912963867, 35.6412239074707, 38.41405487060547, 41.1868896484375, 43.959720611572266, 46.73255157470703, 49.50538635253906, 52.27821731567383, 55.05105209350586, 57.823883056640625, 60.596717834472656, 63.36954879760742, 66.14237976074219, 68.91521453857422, 71.68804168701172, 74.46087646484375, 77.23371124267578, 80.00654602050781, 82.77937316894531, 85.55220794677734, 88.32504272460938]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 7.0, 11.0, 10.0, 24.0, 22.0, 41.0, 76.0, 132.0, 242.0, 457.0, 1119.0, 3500.0, 16445.0, 741719.0, 3407528.0, 17047.0, 3650.0, 1150.0, 509.0, 238.0, 138.0, 76.0, 35.0, 36.0, 18.0, 20.0, 7.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -50.97021484375, -49.3779296875, -47.78564453125, -46.193359375, -44.60107421875, -43.0087890625, -41.41650390625, -39.82421875, -38.23193359375, -36.6396484375, -35.04736328125, -33.455078125, -31.86279296875, -30.2705078125, -28.67822265625, -27.0859375, -25.49365234375, -23.9013671875, -22.30908203125, -20.716796875, -19.12451171875, -17.5322265625, -15.93994140625, -14.34765625, -12.75537109375, -11.1630859375, -9.57080078125, -7.978515625, -6.38623046875, -4.7939453125, -3.20166015625, -1.609375, -0.01708984375, 1.5751953125, 3.16748046875, 4.759765625, 6.35205078125, 7.9443359375, 9.53662109375, 11.12890625, 12.72119140625, 14.3134765625, 15.90576171875, 17.498046875, 19.09033203125, 20.6826171875, 22.27490234375, 23.8671875, 25.45947265625, 27.0517578125, 28.64404296875, 30.236328125, 31.82861328125, 33.4208984375, 35.01318359375, 36.60546875, 38.19775390625, 39.7900390625, 41.38232421875, 42.974609375, 44.56689453125, 46.1591796875, 47.75146484375, 49.34375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 12.0, 18.0, 23.0, 21.0, 22.0, 29.0, 35.0, 34.0, 46.0, 42.0, 53.0, 41.0, 60.0, 51.0, 42.0, 44.0, 33.0, 40.0, 48.0, 38.0, 39.0, 35.0, 34.0, 27.0, 27.0, 14.0, 12.0, 12.0, 9.0, 11.0, 6.0, 4.0, 4.0, 2.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.783935546875, -3.64990234375, -3.515869140625, -3.3818359375, -3.247802734375, -3.11376953125, -2.979736328125, -2.845703125, -2.711669921875, -2.57763671875, -2.443603515625, -2.3095703125, -2.175537109375, -2.04150390625, -1.907470703125, -1.7734375, -1.639404296875, -1.50537109375, -1.371337890625, -1.2373046875, -1.103271484375, -0.96923828125, -0.835205078125, -0.701171875, -0.567138671875, -0.43310546875, -0.299072265625, -0.1650390625, -0.031005859375, 0.10302734375, 0.237060546875, 0.37109375, 0.505126953125, 0.63916015625, 0.773193359375, 0.9072265625, 1.041259765625, 1.17529296875, 1.309326171875, 1.443359375, 1.577392578125, 1.71142578125, 1.845458984375, 1.9794921875, 2.113525390625, 2.24755859375, 2.381591796875, 2.515625, 2.649658203125, 2.78369140625, 2.917724609375, 3.0517578125, 3.185791015625, 3.31982421875, 3.453857421875, 3.587890625, 3.721923828125, 3.85595703125, 3.989990234375, 4.1240234375, 4.258056640625, 4.39208984375, 4.526123046875, 4.66015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 16.0, 12.0, 13.0, 17.0, 26.0, 34.0, 38.0, 85.0, 114.0, 161.0, 208.0, 327.0, 454.0, 746.0, 1208.0, 2242.0, 4430.0, 9498.0, 26059.0, 104286.0, 3612036.0, 352300.0, 49885.0, 15682.0, 6571.0, 3183.0, 1684.0, 986.0, 642.0, 410.0, 274.0, 181.0, 134.0, 107.0, 70.0, 42.0, 48.0, 17.0, 15.0, 7.0, 15.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.5484619140625, -13.042236328125, -12.5360107421875, -12.02978515625, -11.5235595703125, -11.017333984375, -10.5111083984375, -10.0048828125, -9.4986572265625, -8.992431640625, -8.4862060546875, -7.97998046875, -7.4737548828125, -6.967529296875, -6.4613037109375, -5.955078125, -5.4488525390625, -4.942626953125, -4.4364013671875, -3.93017578125, -3.4239501953125, -2.917724609375, -2.4114990234375, -1.9052734375, -1.3990478515625, -0.892822265625, -0.3865966796875, 0.11962890625, 0.6258544921875, 1.132080078125, 1.6383056640625, 2.14453125, 2.6507568359375, 3.156982421875, 3.6632080078125, 4.16943359375, 4.6756591796875, 5.181884765625, 5.6881103515625, 6.1943359375, 6.7005615234375, 7.206787109375, 7.7130126953125, 8.21923828125, 8.7254638671875, 9.231689453125, 9.7379150390625, 10.244140625, 10.7503662109375, 11.256591796875, 11.7628173828125, 12.26904296875, 12.7752685546875, 13.281494140625, 13.7877197265625, 14.2939453125, 14.8001708984375, 15.306396484375, 15.8126220703125, 16.31884765625, 16.8250732421875, 17.331298828125, 17.8375244140625, 18.34375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 12.0, 15.0, 30.0, 30.0, 69.0, 130.0, 267.0, 2630.0, 468.0, 170.0, 66.0, 49.0, 29.0, 18.0, 8.0, 13.0, 10.0, 9.0, 5.0, 3.0, 1.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.156341552734375, -4.04315185546875, -3.929962158203125, -3.8167724609375, -3.703582763671875, -3.59039306640625, -3.477203369140625, -3.364013671875, -3.250823974609375, -3.13763427734375, -3.024444580078125, -2.9112548828125, -2.798065185546875, -2.68487548828125, -2.571685791015625, -2.45849609375, -2.345306396484375, -2.23211669921875, -2.118927001953125, -2.0057373046875, -1.892547607421875, -1.77935791015625, -1.666168212890625, -1.552978515625, -1.439788818359375, -1.32659912109375, -1.213409423828125, -1.1002197265625, -0.987030029296875, -0.87384033203125, -0.760650634765625, -0.6474609375, -0.534271240234375, -0.42108154296875, -0.307891845703125, -0.1947021484375, -0.081512451171875, 0.03167724609375, 0.144866943359375, 0.258056640625, 0.371246337890625, 0.48443603515625, 0.597625732421875, 0.7108154296875, 0.824005126953125, 0.93719482421875, 1.050384521484375, 1.16357421875, 1.276763916015625, 1.38995361328125, 1.503143310546875, 1.6163330078125, 1.729522705078125, 1.84271240234375, 1.955902099609375, 2.069091796875, 2.182281494140625, 2.29547119140625, 2.408660888671875, 2.5218505859375, 2.635040283203125, 2.74822998046875, 2.861419677734375, 2.974609375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 9.0, 11.0, 11.0, 19.0, 16.0, 28.0, 28.0, 31.0, 50.0, 67.0, 72.0, 82.0, 72.0, 73.0, 79.0, 80.0, 65.0, 50.0, 39.0, 30.0, 28.0, 21.0, 13.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.861871719360352, -11.460796356201172, -11.059720993041992, -10.658645629882812, -10.257570266723633, -9.856494903564453, -9.45542049407959, -9.05434513092041, -8.65326976776123, -8.25219440460205, -7.851119041442871, -7.45004415512085, -7.04896879196167, -6.64789342880249, -6.246818542480469, -5.845743179321289, -5.444667816162109, -5.04359245300293, -4.64251708984375, -4.2414422035217285, -3.840366840362549, -3.439291477203369, -3.0382163524627686, -2.637141227722168, -2.2360658645629883, -1.8349906206130981, -1.433915376663208, -1.0328401327133179, -0.6317648887634277, -0.23068952560424805, 0.17038559913635254, 0.5714607238769531, 0.9725360870361328, 1.373611330986023, 1.774686574935913, 2.1757616996765137, 2.5768370628356934, 2.977912425994873, 3.3789875507354736, 3.780062675476074, 4.181138038635254, 4.582213401794434, 4.983288764953613, 5.384363651275635, 5.7854390144348145, 6.186514377593994, 6.587589263916016, 6.988664627075195, 7.389739990234375, 7.790815353393555, 8.191890716552734, 8.592966079711914, 8.994041442871094, 9.395116806030273, 9.796191215515137, 10.197266578674316, 10.598341941833496, 10.999417304992676, 11.400492668151855, 11.801568031311035, 12.202642440795898, 12.603717803955078, 13.004793167114258, 13.405868530273438, 13.806943893432617]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 4.0, 5.0, 5.0, 9.0, 10.0, 7.0, 16.0, 16.0, 29.0, 27.0, 24.0, 34.0, 39.0, 37.0, 39.0, 31.0, 46.0, 48.0, 37.0, 56.0, 45.0, 53.0, 52.0, 54.0, 41.0, 39.0, 32.0, 24.0, 31.0, 26.0, 10.0, 10.0, 8.0, 15.0, 9.0, 6.0, 4.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.728302955627441, -8.423388481140137, -8.118474006652832, -7.813559055328369, -7.5086445808410645, -7.20373010635376, -6.898815155029297, -6.593900680541992, -6.2889862060546875, -5.984071731567383, -5.679157257080078, -5.374242305755615, -5.0693278312683105, -4.764413356781006, -4.459498405456543, -4.154583930969238, -3.8496694564819336, -3.544754981994629, -3.239840269088745, -2.9349255561828613, -2.6300110816955566, -2.325096607208252, -2.020181894302368, -1.7152671813964844, -1.4103527069091797, -1.1054381132125854, -0.8005235195159912, -0.495608925819397, -0.19069433212280273, 0.1142202615737915, 0.41913485527038574, 0.7240495681762695, 1.0289630889892578, 1.333877682685852, 1.6387922763824463, 1.9437068700790405, 2.2486214637756348, 2.5535359382629395, 2.8584506511688232, 3.163365364074707, 3.4682798385620117, 3.7731943130493164, 4.078108787536621, 4.383023738861084, 4.687938213348389, 4.992852687835693, 5.297767639160156, 5.602682113647461, 5.907596588134766, 6.21251106262207, 6.517425537109375, 6.822340488433838, 7.127254962921143, 7.432169437408447, 7.73708438873291, 8.041998863220215, 8.34691333770752, 8.651827812194824, 8.956742286682129, 9.261656761169434, 9.566572189331055, 9.87148666381836, 10.176401138305664, 10.481315612792969, 10.786230087280273]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 13.0, 12.0, 18.0, 32.0, 39.0, 58.0, 103.0, 136.0, 213.0, 411.0, 654.0, 1123.0, 2011.0, 4014.0, 7756.0, 16571.0, 35815.0, 77533.0, 153954.0, 239985.0, 231307.0, 142797.0, 70560.0, 32981.0, 15201.0, 7037.0, 3635.0, 1935.0, 1070.0, 608.0, 316.0, 229.0, 139.0, 89.0, 66.0, 45.0, 23.0, 17.0, 12.0, 7.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3551025390625, -10.975830078125, -10.5965576171875, -10.21728515625, -9.8380126953125, -9.458740234375, -9.0794677734375, -8.7001953125, -8.3209228515625, -7.941650390625, -7.5623779296875, -7.18310546875, -6.8038330078125, -6.424560546875, -6.0452880859375, -5.666015625, -5.2867431640625, -4.907470703125, -4.5281982421875, -4.14892578125, -3.7696533203125, -3.390380859375, -3.0111083984375, -2.6318359375, -2.2525634765625, -1.873291015625, -1.4940185546875, -1.11474609375, -0.7354736328125, -0.356201171875, 0.0230712890625, 0.40234375, 0.7816162109375, 1.160888671875, 1.5401611328125, 1.91943359375, 2.2987060546875, 2.677978515625, 3.0572509765625, 3.4365234375, 3.8157958984375, 4.195068359375, 4.5743408203125, 4.95361328125, 5.3328857421875, 5.712158203125, 6.0914306640625, 6.470703125, 6.8499755859375, 7.229248046875, 7.6085205078125, 7.98779296875, 8.3670654296875, 8.746337890625, 9.1256103515625, 9.5048828125, 9.8841552734375, 10.263427734375, 10.6427001953125, 11.02197265625, 11.4012451171875, 11.780517578125, 12.1597900390625, 12.5390625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 9.0, 7.0, 6.0, 10.0, 14.0, 19.0, 23.0, 19.0, 26.0, 16.0, 41.0, 37.0, 41.0, 47.0, 46.0, 46.0, 44.0, 53.0, 35.0, 48.0, 52.0, 38.0, 41.0, 36.0, 41.0, 29.0, 37.0, 29.0, 28.0, 19.0, 11.0, 7.0, 10.0, 5.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.27239990234375, -4.1307373046875, -3.98907470703125, -3.847412109375, -3.70574951171875, -3.5640869140625, -3.42242431640625, -3.28076171875, -3.13909912109375, -2.9974365234375, -2.85577392578125, -2.714111328125, -2.57244873046875, -2.4307861328125, -2.28912353515625, -2.1474609375, -2.00579833984375, -1.8641357421875, -1.72247314453125, -1.580810546875, -1.43914794921875, -1.2974853515625, -1.15582275390625, -1.01416015625, -0.87249755859375, -0.7308349609375, -0.58917236328125, -0.447509765625, -0.30584716796875, -0.1641845703125, -0.02252197265625, 0.119140625, 0.26080322265625, 0.4024658203125, 0.54412841796875, 0.685791015625, 0.82745361328125, 0.9691162109375, 1.11077880859375, 1.25244140625, 1.39410400390625, 1.5357666015625, 1.67742919921875, 1.819091796875, 1.96075439453125, 2.1024169921875, 2.24407958984375, 2.3857421875, 2.52740478515625, 2.6690673828125, 2.81072998046875, 2.952392578125, 3.09405517578125, 3.2357177734375, 3.37738037109375, 3.51904296875, 3.66070556640625, 3.8023681640625, 3.94403076171875, 4.085693359375, 4.22735595703125, 4.3690185546875, 4.51068115234375, 4.65234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 9.0, 8.0, 22.0, 13.0, 18.0, 30.0, 50.0, 65.0, 73.0, 107.0, 140.0, 214.0, 240.0, 319.0, 509.0, 792.0, 1201.0, 2366.0, 9063.0, 74688.0, 631130.0, 290679.0, 27531.0, 4454.0, 1621.0, 881.0, 638.0, 458.0, 334.0, 233.0, 163.0, 134.0, 89.0, 71.0, 54.0, 33.0, 29.0, 27.0, 15.0, 13.0, 5.0, 7.0, 7.0, 7.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.96875, -28.027587890625, -27.08642578125, -26.145263671875, -25.2041015625, -24.262939453125, -23.32177734375, -22.380615234375, -21.439453125, -20.498291015625, -19.55712890625, -18.615966796875, -17.6748046875, -16.733642578125, -15.79248046875, -14.851318359375, -13.91015625, -12.968994140625, -12.02783203125, -11.086669921875, -10.1455078125, -9.204345703125, -8.26318359375, -7.322021484375, -6.380859375, -5.439697265625, -4.49853515625, -3.557373046875, -2.6162109375, -1.675048828125, -0.73388671875, 0.207275390625, 1.1484375, 2.089599609375, 3.03076171875, 3.971923828125, 4.9130859375, 5.854248046875, 6.79541015625, 7.736572265625, 8.677734375, 9.618896484375, 10.56005859375, 11.501220703125, 12.4423828125, 13.383544921875, 14.32470703125, 15.265869140625, 16.20703125, 17.148193359375, 18.08935546875, 19.030517578125, 19.9716796875, 20.912841796875, 21.85400390625, 22.795166015625, 23.736328125, 24.677490234375, 25.61865234375, 26.559814453125, 27.5009765625, 28.442138671875, 29.38330078125, 30.324462890625, 31.265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 10.0, 19.0, 16.0, 22.0, 24.0, 30.0, 45.0, 50.0, 57.0, 60.0, 65.0, 68.0, 68.0, 67.0, 56.0, 63.0, 58.0, 46.0, 26.0, 37.0, 32.0, 27.0, 21.0, 10.0, 9.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.59375, -38.689697265625, -37.78564453125, -36.881591796875, -35.9775390625, -35.073486328125, -34.16943359375, -33.265380859375, -32.361328125, -31.457275390625, -30.55322265625, -29.649169921875, -28.7451171875, -27.841064453125, -26.93701171875, -26.032958984375, -25.12890625, -24.224853515625, -23.32080078125, -22.416748046875, -21.5126953125, -20.608642578125, -19.70458984375, -18.800537109375, -17.896484375, -16.992431640625, -16.08837890625, -15.184326171875, -14.2802734375, -13.376220703125, -12.47216796875, -11.568115234375, -10.6640625, -9.760009765625, -8.85595703125, -7.951904296875, -7.0478515625, -6.143798828125, -5.23974609375, -4.335693359375, -3.431640625, -2.527587890625, -1.62353515625, -0.719482421875, 0.1845703125, 1.088623046875, 1.99267578125, 2.896728515625, 3.80078125, 4.704833984375, 5.60888671875, 6.512939453125, 7.4169921875, 8.321044921875, 9.22509765625, 10.129150390625, 11.033203125, 11.937255859375, 12.84130859375, 13.745361328125, 14.6494140625, 15.553466796875, 16.45751953125, 17.361572265625, 18.265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 4.0, 8.0, 17.0, 19.0, 32.0, 30.0, 46.0, 64.0, 118.0, 172.0, 299.0, 549.0, 1125.0, 2232.0, 6220.0, 20764.0, 106445.0, 574049.0, 274360.0, 44071.0, 10883.0, 3623.0, 1571.0, 738.0, 396.0, 237.0, 146.0, 95.0, 61.0, 50.0, 38.0, 16.0, 14.0, 12.0, 9.0, 9.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.96875, -11.56640625, -11.1640625, -10.76171875, -10.359375, -9.95703125, -9.5546875, -9.15234375, -8.75, -8.34765625, -7.9453125, -7.54296875, -7.140625, -6.73828125, -6.3359375, -5.93359375, -5.53125, -5.12890625, -4.7265625, -4.32421875, -3.921875, -3.51953125, -3.1171875, -2.71484375, -2.3125, -1.91015625, -1.5078125, -1.10546875, -0.703125, -0.30078125, 0.1015625, 0.50390625, 0.90625, 1.30859375, 1.7109375, 2.11328125, 2.515625, 2.91796875, 3.3203125, 3.72265625, 4.125, 4.52734375, 4.9296875, 5.33203125, 5.734375, 6.13671875, 6.5390625, 6.94140625, 7.34375, 7.74609375, 8.1484375, 8.55078125, 8.953125, 9.35546875, 9.7578125, 10.16015625, 10.5625, 10.96484375, 11.3671875, 11.76953125, 12.171875, 12.57421875, 12.9765625, 13.37890625, 13.78125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 10.0, 8.0, 20.0, 19.0, 29.0, 43.0, 52.0, 54.0, 86.0, 87.0, 106.0, 95.0, 87.0, 89.0, 53.0, 39.0, 39.0, 25.0, 10.0, 8.0, 5.0, 3.0, 2.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00232696533203125, -0.0022652000188827515, -0.002203434705734253, -0.0021416693925857544, -0.002079904079437256, -0.0020181387662887573, -0.001956373453140259, -0.0018946081399917603, -0.0018328428268432617, -0.0017710775136947632, -0.0017093122005462646, -0.0016475468873977661, -0.0015857815742492676, -0.001524016261100769, -0.0014622509479522705, -0.001400485634803772, -0.0013387203216552734, -0.001276955008506775, -0.0012151896953582764, -0.0011534243822097778, -0.0010916590690612793, -0.0010298937559127808, -0.0009681284427642822, -0.0009063631296157837, -0.0008445978164672852, -0.0007828325033187866, -0.0007210671901702881, -0.0006593018770217896, -0.000597536563873291, -0.0005357712507247925, -0.00047400593757629395, -0.0004122406244277954, -0.0003504753112792969, -0.00028870999813079834, -0.0002269446849822998, -0.00016517937183380127, -0.00010341405868530273, -4.16487455368042e-05, 2.0116567611694336e-05, 8.188188076019287e-05, 0.0001436471939086914, 0.00020541250705718994, 0.0002671778202056885, 0.000328943133354187, 0.00039070844650268555, 0.0004524737596511841, 0.0005142390727996826, 0.0005760043859481812, 0.0006377696990966797, 0.0006995350122451782, 0.0007613003253936768, 0.0008230656385421753, 0.0008848309516906738, 0.0009465962648391724, 0.001008361577987671, 0.0010701268911361694, 0.001131892204284668, 0.0011936575174331665, 0.001255422830581665, 0.0013171881437301636, 0.0013789534568786621, 0.0014407187700271606, 0.0015024840831756592, 0.0015642493963241577, 0.0016260147094726562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 14.0, 13.0, 16.0, 32.0, 55.0, 94.0, 240.0, 500.0, 1552.0, 7867.0, 184862.0, 826295.0, 22564.0, 2976.0, 817.0, 302.0, 160.0, 85.0, 39.0, 21.0, 10.0, 10.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.40625, -33.456298828125, -32.50634765625, -31.556396484375, -30.6064453125, -29.656494140625, -28.70654296875, -27.756591796875, -26.806640625, -25.856689453125, -24.90673828125, -23.956787109375, -23.0068359375, -22.056884765625, -21.10693359375, -20.156982421875, -19.20703125, -18.257080078125, -17.30712890625, -16.357177734375, -15.4072265625, -14.457275390625, -13.50732421875, -12.557373046875, -11.607421875, -10.657470703125, -9.70751953125, -8.757568359375, -7.8076171875, -6.857666015625, -5.90771484375, -4.957763671875, -4.0078125, -3.057861328125, -2.10791015625, -1.157958984375, -0.2080078125, 0.741943359375, 1.69189453125, 2.641845703125, 3.591796875, 4.541748046875, 5.49169921875, 6.441650390625, 7.3916015625, 8.341552734375, 9.29150390625, 10.241455078125, 11.19140625, 12.141357421875, 13.09130859375, 14.041259765625, 14.9912109375, 15.941162109375, 16.89111328125, 17.841064453125, 18.791015625, 19.740966796875, 20.69091796875, 21.640869140625, 22.5908203125, 23.540771484375, 24.49072265625, 25.440673828125, 26.390625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 11.0, 12.0, 27.0, 43.0, 59.0, 72.0, 103.0, 134.0, 131.0, 128.0, 92.0, 55.0, 44.0, 22.0, 16.0, 17.0, 15.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.78125, -13.210205078125, -12.63916015625, -12.068115234375, -11.4970703125, -10.926025390625, -10.35498046875, -9.783935546875, -9.212890625, -8.641845703125, -8.07080078125, -7.499755859375, -6.9287109375, -6.357666015625, -5.78662109375, -5.215576171875, -4.64453125, -4.073486328125, -3.50244140625, -2.931396484375, -2.3603515625, -1.789306640625, -1.21826171875, -0.647216796875, -0.076171875, 0.494873046875, 1.06591796875, 1.636962890625, 2.2080078125, 2.779052734375, 3.35009765625, 3.921142578125, 4.4921875, 5.063232421875, 5.63427734375, 6.205322265625, 6.7763671875, 7.347412109375, 7.91845703125, 8.489501953125, 9.060546875, 9.631591796875, 10.20263671875, 10.773681640625, 11.3447265625, 11.915771484375, 12.48681640625, 13.057861328125, 13.62890625, 14.199951171875, 14.77099609375, 15.342041015625, 15.9130859375, 16.484130859375, 17.05517578125, 17.626220703125, 18.197265625, 18.768310546875, 19.33935546875, 19.910400390625, 20.4814453125, 21.052490234375, 21.62353515625, 22.194580078125, 22.765625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 36.0, 165.0, 378.0, 283.0, 105.0, 26.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-695.87353515625, -679.59033203125, -663.3070678710938, -647.0238647460938, -630.7406005859375, -614.4573974609375, -598.1741943359375, -581.8909301757812, -565.6077270507812, -549.3245239257812, -533.041259765625, -516.758056640625, -500.4748229980469, -484.19158935546875, -467.90838623046875, -451.6251525878906, -435.3419189453125, -419.0586853027344, -402.77545166015625, -386.49224853515625, -370.2090148925781, -353.92578125, -337.642578125, -321.3593444824219, -305.07611083984375, -288.7928771972656, -272.5096435546875, -256.2264404296875, -239.94320678710938, -223.65997314453125, -207.3767547607422, -191.09353637695312, -174.81024169921875, -158.52700805664062, -142.24378967285156, -125.96056365966797, -109.67733764648438, -93.39411163330078, -77.11088562011719, -60.827659606933594, -44.54443359375, -28.261207580566406, -11.977981567382812, 4.305244445800781, 20.588470458984375, 36.87169647216797, 53.15492248535156, 69.43814849853516, 85.72137451171875, 102.00460052490234, 118.28782653808594, 134.571044921875, 150.85427856445312, 167.13751220703125, 183.4207305908203, 199.70394897460938, 215.9871826171875, 232.27041625976562, 248.5536346435547, 264.83685302734375, 281.1200866699219, 297.4033203125, 313.6865234375, 329.9697570800781, 346.25299072265625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 4.0, 4.0, 9.0, 10.0, 6.0, 15.0, 12.0, 13.0, 22.0, 16.0, 25.0, 25.0, 52.0, 29.0, 42.0, 41.0, 47.0, 45.0, 48.0, 49.0, 67.0, 34.0, 35.0, 45.0, 42.0, 41.0, 27.0, 32.0, 23.0, 16.0, 30.0, 12.0, 12.0, 13.0, 11.0, 6.0, 10.0, 9.0, 6.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-104.74134826660156, -101.6285171508789, -98.51568603515625, -95.40284729003906, -92.2900161743164, -89.17718505859375, -86.06434631347656, -82.9515151977539, -79.83868408203125, -76.7258529663086, -73.61302185058594, -70.50018310546875, -67.3873519897461, -64.27452087402344, -61.161685943603516, -58.048851013183594, -54.93601989746094, -51.82318878173828, -48.71035385131836, -45.59751892089844, -42.48468780517578, -39.371856689453125, -36.2590217590332, -33.14618682861328, -30.033355712890625, -26.920522689819336, -23.807689666748047, -20.694856643676758, -17.58202362060547, -14.46919059753418, -11.35635757446289, -8.243524551391602, -5.1306915283203125, -2.0178585052490234, 1.0949745178222656, 4.207807540893555, 7.320640563964844, 10.433473587036133, 13.546306610107422, 16.65913963317871, 19.77197265625, 22.88480567932129, 25.997638702392578, 29.110471725463867, 32.223304748535156, 35.33613586425781, 38.448970794677734, 41.561805725097656, 44.67463684082031, 47.78746795654297, 50.90030288696289, 54.01313781738281, 57.12596893310547, 60.238800048828125, 63.35163497924805, 66.46446990966797, 69.57730102539062, 72.69013214111328, 75.80296325683594, 78.91580200195312, 82.02863311767578, 85.14146423339844, 88.25430297851562, 91.36713409423828, 94.47996520996094]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 10.0, 10.0, 9.0, 21.0, 35.0, 41.0, 60.0, 105.0, 210.0, 361.0, 784.0, 1935.0, 5577.0, 24944.0, 465784.0, 3650697.0, 32645.0, 6889.0, 2220.0, 914.0, 388.0, 244.0, 132.0, 72.0, 62.0, 46.0, 21.0, 15.0, 12.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.125, -33.02685546875, -31.9287109375, -30.83056640625, -29.732421875, -28.63427734375, -27.5361328125, -26.43798828125, -25.33984375, -24.24169921875, -23.1435546875, -22.04541015625, -20.947265625, -19.84912109375, -18.7509765625, -17.65283203125, -16.5546875, -15.45654296875, -14.3583984375, -13.26025390625, -12.162109375, -11.06396484375, -9.9658203125, -8.86767578125, -7.76953125, -6.67138671875, -5.5732421875, -4.47509765625, -3.376953125, -2.27880859375, -1.1806640625, -0.08251953125, 1.015625, 2.11376953125, 3.2119140625, 4.31005859375, 5.408203125, 6.50634765625, 7.6044921875, 8.70263671875, 9.80078125, 10.89892578125, 11.9970703125, 13.09521484375, 14.193359375, 15.29150390625, 16.3896484375, 17.48779296875, 18.5859375, 19.68408203125, 20.7822265625, 21.88037109375, 22.978515625, 24.07666015625, 25.1748046875, 26.27294921875, 27.37109375, 28.46923828125, 29.5673828125, 30.66552734375, 31.763671875, 32.86181640625, 33.9599609375, 35.05810546875, 36.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 7.0, 10.0, 14.0, 8.0, 14.0, 13.0, 17.0, 19.0, 31.0, 41.0, 40.0, 32.0, 40.0, 35.0, 50.0, 60.0, 51.0, 51.0, 43.0, 47.0, 43.0, 39.0, 42.0, 37.0, 35.0, 28.0, 27.0, 22.0, 18.0, 9.0, 8.0, 12.0, 14.0, 10.0, 4.0, 4.0, 2.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.978515625, -3.843414306640625, -3.70831298828125, -3.573211669921875, -3.4381103515625, -3.303009033203125, -3.16790771484375, -3.032806396484375, -2.897705078125, -2.762603759765625, -2.62750244140625, -2.492401123046875, -2.3572998046875, -2.222198486328125, -2.08709716796875, -1.951995849609375, -1.81689453125, -1.681793212890625, -1.54669189453125, -1.411590576171875, -1.2764892578125, -1.141387939453125, -1.00628662109375, -0.871185302734375, -0.736083984375, -0.600982666015625, -0.46588134765625, -0.330780029296875, -0.1956787109375, -0.060577392578125, 0.07452392578125, 0.209625244140625, 0.3447265625, 0.479827880859375, 0.61492919921875, 0.750030517578125, 0.8851318359375, 1.020233154296875, 1.15533447265625, 1.290435791015625, 1.425537109375, 1.560638427734375, 1.69573974609375, 1.830841064453125, 1.9659423828125, 2.101043701171875, 2.23614501953125, 2.371246337890625, 2.50634765625, 2.641448974609375, 2.77655029296875, 2.911651611328125, 3.0467529296875, 3.181854248046875, 3.31695556640625, 3.452056884765625, 3.587158203125, 3.722259521484375, 3.85736083984375, 3.992462158203125, 4.1275634765625, 4.262664794921875, 4.39776611328125, 4.532867431640625, 4.66796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 6.0, 17.0, 27.0, 31.0, 47.0, 65.0, 99.0, 156.0, 210.0, 277.0, 427.0, 660.0, 996.0, 1423.0, 2486.0, 4067.0, 7324.0, 15124.0, 38313.0, 141681.0, 3428633.0, 433769.0, 69858.0, 23873.0, 10347.0, 5655.0, 3080.0, 1902.0, 1228.0, 872.0, 478.0, 341.0, 217.0, 174.0, 138.0, 84.0, 60.0, 34.0, 29.0, 23.0, 13.0, 11.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -11.9818115234375, -11.565185546875, -11.1485595703125, -10.73193359375, -10.3153076171875, -9.898681640625, -9.4820556640625, -9.0654296875, -8.6488037109375, -8.232177734375, -7.8155517578125, -7.39892578125, -6.9822998046875, -6.565673828125, -6.1490478515625, -5.732421875, -5.3157958984375, -4.899169921875, -4.4825439453125, -4.06591796875, -3.6492919921875, -3.232666015625, -2.8160400390625, -2.3994140625, -1.9827880859375, -1.566162109375, -1.1495361328125, -0.73291015625, -0.3162841796875, 0.100341796875, 0.5169677734375, 0.93359375, 1.3502197265625, 1.766845703125, 2.1834716796875, 2.60009765625, 3.0167236328125, 3.433349609375, 3.8499755859375, 4.2666015625, 4.6832275390625, 5.099853515625, 5.5164794921875, 5.93310546875, 6.3497314453125, 6.766357421875, 7.1829833984375, 7.599609375, 8.0162353515625, 8.432861328125, 8.8494873046875, 9.26611328125, 9.6827392578125, 10.099365234375, 10.5159912109375, 10.9326171875, 11.3492431640625, 11.765869140625, 12.1824951171875, 12.59912109375, 13.0157470703125, 13.432373046875, 13.8489990234375, 14.265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 6.0, 11.0, 11.0, 14.0, 23.0, 39.0, 46.0, 75.0, 151.0, 323.0, 2387.0, 478.0, 199.0, 95.0, 58.0, 41.0, 26.0, 16.0, 13.0, 8.0, 10.0, 4.0, 8.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.01446533203125, -2.8922119140625, -2.76995849609375, -2.647705078125, -2.52545166015625, -2.4031982421875, -2.28094482421875, -2.15869140625, -2.03643798828125, -1.9141845703125, -1.79193115234375, -1.669677734375, -1.54742431640625, -1.4251708984375, -1.30291748046875, -1.1806640625, -1.05841064453125, -0.9361572265625, -0.81390380859375, -0.691650390625, -0.56939697265625, -0.4471435546875, -0.32489013671875, -0.20263671875, -0.08038330078125, 0.0418701171875, 0.16412353515625, 0.286376953125, 0.40863037109375, 0.5308837890625, 0.65313720703125, 0.775390625, 0.89764404296875, 1.0198974609375, 1.14215087890625, 1.264404296875, 1.38665771484375, 1.5089111328125, 1.63116455078125, 1.75341796875, 1.87567138671875, 1.9979248046875, 2.12017822265625, 2.242431640625, 2.36468505859375, 2.4869384765625, 2.60919189453125, 2.7314453125, 2.85369873046875, 2.9759521484375, 3.09820556640625, 3.220458984375, 3.34271240234375, 3.4649658203125, 3.58721923828125, 3.70947265625, 3.83172607421875, 3.9539794921875, 4.07623291015625, 4.198486328125, 4.32073974609375, 4.4429931640625, 4.56524658203125, 4.6875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 36.0, 125.0, 266.0, 280.0, 190.0, 66.0, 24.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.20384216308594, -31.24742317199707, -29.291004180908203, -27.334583282470703, -25.378164291381836, -23.42174530029297, -21.46532440185547, -19.5089054107666, -17.552486419677734, -15.596067428588867, -13.639647483825684, -11.6832275390625, -9.726808547973633, -7.770389556884766, -5.813969612121582, -3.8575496673583984, -1.9011306762695312, 0.05528879165649414, 2.0117082595825195, 3.968127727508545, 5.92454719543457, 7.8809661865234375, 9.837386131286621, 11.793806076049805, 13.750225067138672, 15.706644058227539, 17.663063049316406, 19.619483947753906, 21.575902938842773, 23.53232192993164, 25.48874282836914, 27.445161819458008, 29.401580810546875, 31.357999801635742, 33.31441879272461, 35.27083969116211, 37.227256774902344, 39.183677673339844, 41.140098571777344, 43.096519470214844, 45.05293655395508, 47.00935745239258, 48.96577453613281, 50.92219543457031, 52.87861633300781, 54.83503341674805, 56.79145431518555, 58.74787139892578, 60.70429229736328, 62.66071319580078, 64.61713409423828, 66.57354736328125, 68.52996826171875, 70.48638916015625, 72.44281005859375, 74.39923095703125, 76.35565185546875, 78.31207275390625, 80.26849365234375, 82.22490692138672, 84.18132781982422, 86.13774871826172, 88.09416961669922, 90.05059051513672, 92.00700378417969]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 10.0, 9.0, 19.0, 19.0, 20.0, 23.0, 21.0, 33.0, 31.0, 27.0, 37.0, 29.0, 35.0, 43.0, 42.0, 30.0, 47.0, 44.0, 46.0, 49.0, 34.0, 32.0, 22.0, 35.0, 31.0, 17.0, 38.0, 21.0, 19.0, 19.0, 13.0, 16.0, 16.0, 11.0, 9.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.307706832885742, -10.970895767211914, -10.634084701538086, -10.297273635864258, -9.960461616516113, -9.623650550842285, -9.286839485168457, -8.950028419494629, -8.613216400146484, -8.276405334472656, -7.93959379196167, -7.602782726287842, -7.2659711837768555, -6.929160118103027, -6.592349052429199, -6.255537986755371, -5.918726921081543, -5.581915855407715, -5.2451043128967285, -4.9082932472229, -4.571481704711914, -4.234670639038086, -3.897859573364258, -3.5610482692718506, -3.2242369651794434, -2.887425661087036, -2.550614356994629, -2.213803291320801, -1.8769919872283936, -1.5401806831359863, -1.2033696174621582, -0.866558313369751, -0.5297470092773438, -0.1929357647895813, 0.14387547969818115, 0.48068666458129883, 0.817497968673706, 1.1543092727661133, 1.4911203384399414, 1.8279316425323486, 2.164742946624756, 2.501554250717163, 2.8383655548095703, 3.1751766204833984, 3.5119879245758057, 3.848799228668213, 4.185610294342041, 4.522421836853027, 4.8592329025268555, 5.196043968200684, 5.53285551071167, 5.869666576385498, 6.206478118896484, 6.5432891845703125, 6.880100250244141, 7.216911315917969, 7.553722858428955, 7.890533924102783, 8.22734546661377, 8.564156532287598, 8.900967597961426, 9.23777961730957, 9.574590682983398, 9.911401748657227, 10.248212814331055]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 8.0, 16.0, 26.0, 39.0, 39.0, 73.0, 107.0, 170.0, 249.0, 385.0, 564.0, 959.0, 1681.0, 2932.0, 5498.0, 10842.0, 22879.0, 49054.0, 103132.0, 191439.0, 251251.0, 198055.0, 108452.0, 51971.0, 24042.0, 11424.0, 5673.0, 3116.0, 1691.0, 1032.0, 662.0, 348.0, 260.0, 153.0, 108.0, 79.0, 50.0, 31.0, 18.0, 5.0, 3.0, 13.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.390625, -9.110595703125, -8.83056640625, -8.550537109375, -8.2705078125, -7.990478515625, -7.71044921875, -7.430419921875, -7.150390625, -6.870361328125, -6.59033203125, -6.310302734375, -6.0302734375, -5.750244140625, -5.47021484375, -5.190185546875, -4.91015625, -4.630126953125, -4.35009765625, -4.070068359375, -3.7900390625, -3.510009765625, -3.22998046875, -2.949951171875, -2.669921875, -2.389892578125, -2.10986328125, -1.829833984375, -1.5498046875, -1.269775390625, -0.98974609375, -0.709716796875, -0.4296875, -0.149658203125, 0.13037109375, 0.410400390625, 0.6904296875, 0.970458984375, 1.25048828125, 1.530517578125, 1.810546875, 2.090576171875, 2.37060546875, 2.650634765625, 2.9306640625, 3.210693359375, 3.49072265625, 3.770751953125, 4.05078125, 4.330810546875, 4.61083984375, 4.890869140625, 5.1708984375, 5.450927734375, 5.73095703125, 6.010986328125, 6.291015625, 6.571044921875, 6.85107421875, 7.131103515625, 7.4111328125, 7.691162109375, 7.97119140625, 8.251220703125, 8.53125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 12.0, 12.0, 16.0, 16.0, 17.0, 24.0, 23.0, 34.0, 31.0, 33.0, 38.0, 35.0, 32.0, 50.0, 55.0, 56.0, 59.0, 39.0, 38.0, 49.0, 34.0, 35.0, 37.0, 28.0, 28.0, 21.0, 16.0, 16.0, 16.0, 12.0, 16.0, 11.0, 8.0, 6.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.994140625, -3.856597900390625, -3.71905517578125, -3.581512451171875, -3.4439697265625, -3.306427001953125, -3.16888427734375, -3.031341552734375, -2.893798828125, -2.756256103515625, -2.61871337890625, -2.481170654296875, -2.3436279296875, -2.206085205078125, -2.06854248046875, -1.930999755859375, -1.79345703125, -1.655914306640625, -1.51837158203125, -1.380828857421875, -1.2432861328125, -1.105743408203125, -0.96820068359375, -0.830657958984375, -0.693115234375, -0.555572509765625, -0.41802978515625, -0.280487060546875, -0.1429443359375, -0.005401611328125, 0.13214111328125, 0.269683837890625, 0.4072265625, 0.544769287109375, 0.68231201171875, 0.819854736328125, 0.9573974609375, 1.094940185546875, 1.23248291015625, 1.370025634765625, 1.507568359375, 1.645111083984375, 1.78265380859375, 1.920196533203125, 2.0577392578125, 2.195281982421875, 2.33282470703125, 2.470367431640625, 2.60791015625, 2.745452880859375, 2.88299560546875, 3.020538330078125, 3.1580810546875, 3.295623779296875, 3.43316650390625, 3.570709228515625, 3.708251953125, 3.845794677734375, 3.98333740234375, 4.120880126953125, 4.2584228515625, 4.395965576171875, 4.53350830078125, 4.671051025390625, 4.80859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 16.0, 11.0, 14.0, 30.0, 29.0, 39.0, 69.0, 77.0, 107.0, 146.0, 196.0, 283.0, 333.0, 484.0, 697.0, 1107.0, 1845.0, 5059.0, 31541.0, 387526.0, 557290.0, 48966.0, 6628.0, 2050.0, 1191.0, 719.0, 532.0, 382.0, 273.0, 231.0, 174.0, 136.0, 98.0, 69.0, 58.0, 32.0, 28.0, 16.0, 17.0, 13.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-23.84375, -23.076904296875, -22.31005859375, -21.543212890625, -20.7763671875, -20.009521484375, -19.24267578125, -18.475830078125, -17.708984375, -16.942138671875, -16.17529296875, -15.408447265625, -14.6416015625, -13.874755859375, -13.10791015625, -12.341064453125, -11.57421875, -10.807373046875, -10.04052734375, -9.273681640625, -8.5068359375, -7.739990234375, -6.97314453125, -6.206298828125, -5.439453125, -4.672607421875, -3.90576171875, -3.138916015625, -2.3720703125, -1.605224609375, -0.83837890625, -0.071533203125, 0.6953125, 1.462158203125, 2.22900390625, 2.995849609375, 3.7626953125, 4.529541015625, 5.29638671875, 6.063232421875, 6.830078125, 7.596923828125, 8.36376953125, 9.130615234375, 9.8974609375, 10.664306640625, 11.43115234375, 12.197998046875, 12.96484375, 13.731689453125, 14.49853515625, 15.265380859375, 16.0322265625, 16.799072265625, 17.56591796875, 18.332763671875, 19.099609375, 19.866455078125, 20.63330078125, 21.400146484375, 22.1669921875, 22.933837890625, 23.70068359375, 24.467529296875, 25.234375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 6.0, 11.0, 14.0, 14.0, 11.0, 17.0, 17.0, 14.0, 23.0, 19.0, 24.0, 32.0, 42.0, 34.0, 32.0, 42.0, 48.0, 41.0, 49.0, 39.0, 57.0, 40.0, 44.0, 40.0, 38.0, 28.0, 37.0, 26.0, 23.0, 20.0, 16.0, 20.0, 13.0, 13.0, 7.0, 5.0, 4.0, 5.0, 6.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.4375, -19.834228515625, -19.23095703125, -18.627685546875, -18.0244140625, -17.421142578125, -16.81787109375, -16.214599609375, -15.611328125, -15.008056640625, -14.40478515625, -13.801513671875, -13.1982421875, -12.594970703125, -11.99169921875, -11.388427734375, -10.78515625, -10.181884765625, -9.57861328125, -8.975341796875, -8.3720703125, -7.768798828125, -7.16552734375, -6.562255859375, -5.958984375, -5.355712890625, -4.75244140625, -4.149169921875, -3.5458984375, -2.942626953125, -2.33935546875, -1.736083984375, -1.1328125, -0.529541015625, 0.07373046875, 0.677001953125, 1.2802734375, 1.883544921875, 2.48681640625, 3.090087890625, 3.693359375, 4.296630859375, 4.89990234375, 5.503173828125, 6.1064453125, 6.709716796875, 7.31298828125, 7.916259765625, 8.51953125, 9.122802734375, 9.72607421875, 10.329345703125, 10.9326171875, 11.535888671875, 12.13916015625, 12.742431640625, 13.345703125, 13.948974609375, 14.55224609375, 15.155517578125, 15.7587890625, 16.362060546875, 16.96533203125, 17.568603515625, 18.171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 8.0, 18.0, 32.0, 55.0, 105.0, 183.0, 374.0, 1083.0, 7161.0, 727211.0, 306399.0, 4311.0, 865.0, 378.0, 179.0, 68.0, 44.0, 25.0, 20.0, 5.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.555419921875, -31.67333984375, -30.791259765625, -29.9091796875, -29.027099609375, -28.14501953125, -27.262939453125, -26.380859375, -25.498779296875, -24.61669921875, -23.734619140625, -22.8525390625, -21.970458984375, -21.08837890625, -20.206298828125, -19.32421875, -18.442138671875, -17.56005859375, -16.677978515625, -15.7958984375, -14.913818359375, -14.03173828125, -13.149658203125, -12.267578125, -11.385498046875, -10.50341796875, -9.621337890625, -8.7392578125, -7.857177734375, -6.97509765625, -6.093017578125, -5.2109375, -4.328857421875, -3.44677734375, -2.564697265625, -1.6826171875, -0.800537109375, 0.08154296875, 0.963623046875, 1.845703125, 2.727783203125, 3.60986328125, 4.491943359375, 5.3740234375, 6.256103515625, 7.13818359375, 8.020263671875, 8.90234375, 9.784423828125, 10.66650390625, 11.548583984375, 12.4306640625, 13.312744140625, 14.19482421875, 15.076904296875, 15.958984375, 16.841064453125, 17.72314453125, 18.605224609375, 19.4873046875, 20.369384765625, 21.25146484375, 22.133544921875, 23.015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 5.0, 4.0, 8.0, 13.0, 19.0, 21.0, 40.0, 64.0, 68.0, 119.0, 119.0, 153.0, 88.0, 82.0, 62.0, 43.0, 26.0, 21.0, 12.0, 6.0, 8.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.002300262451171875, -0.0022467374801635742, -0.0021932125091552734, -0.0021396875381469727, -0.002086162567138672, -0.002032637596130371, -0.0019791126251220703, -0.0019255876541137695, -0.0018720626831054688, -0.001818537712097168, -0.0017650127410888672, -0.0017114877700805664, -0.0016579627990722656, -0.0016044378280639648, -0.001550912857055664, -0.0014973878860473633, -0.0014438629150390625, -0.0013903379440307617, -0.001336812973022461, -0.0012832880020141602, -0.0012297630310058594, -0.0011762380599975586, -0.0011227130889892578, -0.001069188117980957, -0.0010156631469726562, -0.0009621381759643555, -0.0009086132049560547, -0.0008550882339477539, -0.0008015632629394531, -0.0007480382919311523, -0.0006945133209228516, -0.0006409883499145508, -0.00058746337890625, -0.0005339384078979492, -0.00048041343688964844, -0.00042688846588134766, -0.0003733634948730469, -0.0003198385238647461, -0.0002663135528564453, -0.00021278858184814453, -0.00015926361083984375, -0.00010573863983154297, -5.221366882324219e-05, 1.3113021850585938e-06, 5.4836273193359375e-05, 0.00010836124420166016, 0.00016188621520996094, 0.00021541118621826172, 0.0002689361572265625, 0.0003224611282348633, 0.00037598609924316406, 0.00042951107025146484, 0.0004830360412597656, 0.0005365610122680664, 0.0005900859832763672, 0.000643610954284668, 0.0006971359252929688, 0.0007506608963012695, 0.0008041858673095703, 0.0008577108383178711, 0.0009112358093261719, 0.0009647607803344727, 0.0010182857513427734, 0.0010718107223510742, 0.001125335693359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 19.0, 21.0, 40.0, 99.0, 228.0, 806.0, 5583.0, 932535.0, 106097.0, 2314.0, 447.0, 178.0, 91.0, 39.0, 19.0, 18.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.625, -42.208984375, -40.79296875, -39.376953125, -37.9609375, -36.544921875, -35.12890625, -33.712890625, -32.296875, -30.880859375, -29.46484375, -28.048828125, -26.6328125, -25.216796875, -23.80078125, -22.384765625, -20.96875, -19.552734375, -18.13671875, -16.720703125, -15.3046875, -13.888671875, -12.47265625, -11.056640625, -9.640625, -8.224609375, -6.80859375, -5.392578125, -3.9765625, -2.560546875, -1.14453125, 0.271484375, 1.6875, 3.103515625, 4.51953125, 5.935546875, 7.3515625, 8.767578125, 10.18359375, 11.599609375, 13.015625, 14.431640625, 15.84765625, 17.263671875, 18.6796875, 20.095703125, 21.51171875, 22.927734375, 24.34375, 25.759765625, 27.17578125, 28.591796875, 30.0078125, 31.423828125, 32.83984375, 34.255859375, 35.671875, 37.087890625, 38.50390625, 39.919921875, 41.3359375, 42.751953125, 44.16796875, 45.583984375, 47.0]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 20.0, 25.0, 55.0, 87.0, 160.0, 209.0, 211.0, 117.0, 53.0, 27.0, 13.0, 9.0, 6.0, 5.0, 2.0, 2.0], "bins": [-41.21875, -40.4508056640625, -39.682861328125, -38.9149169921875, -38.14697265625, -37.3790283203125, -36.611083984375, -35.8431396484375, -35.0751953125, -34.3072509765625, -33.539306640625, -32.7713623046875, -32.00341796875, -31.2354736328125, -30.467529296875, -29.6995849609375, -28.931640625, -28.1636962890625, -27.395751953125, -26.6278076171875, -25.85986328125, -25.0919189453125, -24.323974609375, -23.5560302734375, -22.7880859375, -22.0201416015625, -21.252197265625, -20.4842529296875, -19.71630859375, -18.9483642578125, -18.180419921875, -17.4124755859375, -16.64453125, -15.8765869140625, -15.108642578125, -14.3406982421875, -13.57275390625, -12.8048095703125, -12.036865234375, -11.2689208984375, -10.5009765625, -9.7330322265625, -8.965087890625, -8.1971435546875, -7.42919921875, -6.6612548828125, -5.893310546875, -5.1253662109375, -4.357421875, -3.5894775390625, -2.821533203125, -2.0535888671875, -1.28564453125, -0.5177001953125, 0.250244140625, 1.0181884765625, 1.7861328125, 2.5540771484375, 3.322021484375, 4.0899658203125, 4.85791015625, 5.6258544921875, 6.393798828125, 7.1617431640625, 7.9296875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 23.0, 112.0, 613.0, 233.0, 23.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-711.9569702148438, -688.7424926757812, -665.5280151367188, -642.3134765625, -619.0989990234375, -595.884521484375, -572.6700439453125, -549.45556640625, -526.2410888671875, -503.026611328125, -479.8121032714844, -456.5976257324219, -433.38311767578125, -410.16864013671875, -386.95416259765625, -363.73968505859375, -340.525146484375, -317.3106689453125, -294.0961608886719, -270.8816833496094, -247.6671905517578, -224.45269775390625, -201.23822021484375, -178.0237274169922, -154.80923461914062, -131.59474182128906, -108.38025665283203, -85.165771484375, -61.95127868652344, -38.736785888671875, -15.522308349609375, 7.6921844482421875, 30.9066162109375, 54.1211051940918, 77.3355941772461, 100.55007934570312, 123.76457214355469, 146.97906494140625, 170.19354248046875, 193.4080352783203, 216.62252807617188, 239.83702087402344, 263.051513671875, 286.2659912109375, 309.48046875, 332.6949768066406, 355.9094543457031, 379.12396240234375, 402.33843994140625, 425.55291748046875, 448.7674255371094, 471.9819030761719, 495.1964111328125, 518.410888671875, 541.6253662109375, 564.83984375, 588.0543212890625, 611.268798828125, 634.4832763671875, 657.69775390625, 680.9122924804688, 704.1267700195312, 727.3412475585938, 750.5557250976562, 773.770263671875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 2.0, 6.0, 3.0, 6.0, 12.0, 11.0, 13.0, 16.0, 12.0, 19.0, 22.0, 23.0, 26.0, 28.0, 42.0, 41.0, 45.0, 46.0, 50.0, 52.0, 54.0, 52.0, 56.0, 44.0, 40.0, 46.0, 36.0, 34.0, 20.0, 29.0, 28.0, 18.0, 13.0, 13.0, 12.0, 5.0, 4.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-121.19415283203125, -117.8420181274414, -114.48988342285156, -111.13775634765625, -107.7856216430664, -104.43348693847656, -101.08135223388672, -97.72921752929688, -94.37709045410156, -91.02495574951172, -87.67282104492188, -84.32069396972656, -80.96855926513672, -77.61642456054688, -74.26428985595703, -70.91215515136719, -67.56002044677734, -64.2078857421875, -60.85575485229492, -57.50362014770508, -54.1514892578125, -50.799354553222656, -47.44721984863281, -44.09508514404297, -40.74295425415039, -37.39081954956055, -34.03868865966797, -30.686553955078125, -27.334421157836914, -23.982288360595703, -20.63015365600586, -17.27802085876465, -13.925888061523438, -10.573755264282227, -7.221621513366699, -3.869487762451172, -0.5173549652099609, 2.83477783203125, 6.186912536621094, 9.539045333862305, 12.891178131103516, 16.243310928344727, 19.595443725585938, 22.94757843017578, 26.299711227416992, 29.651844024658203, 33.00397872924805, 36.356109619140625, 39.70824432373047, 43.06037902832031, 46.41250991821289, 49.764644622802734, 53.11677551269531, 56.468910217285156, 59.821044921875, 63.173179626464844, 66.52531433105469, 69.87744903564453, 73.22958374023438, 76.58171081542969, 79.93384552001953, 83.28598022460938, 86.63811492919922, 89.99024963378906, 93.34237670898438]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 13.0, 19.0, 35.0, 60.0, 94.0, 129.0, 197.0, 376.0, 664.0, 1215.0, 2896.0, 8312.0, 40211.0, 4025306.0, 93984.0, 13036.0, 4050.0, 1685.0, 797.0, 481.0, 254.0, 179.0, 102.0, 57.0, 43.0, 28.0, 10.0, 12.0, 10.0, 3.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.1875, -26.271240234375, -25.35498046875, -24.438720703125, -23.5224609375, -22.606201171875, -21.68994140625, -20.773681640625, -19.857421875, -18.941162109375, -18.02490234375, -17.108642578125, -16.1923828125, -15.276123046875, -14.35986328125, -13.443603515625, -12.52734375, -11.611083984375, -10.69482421875, -9.778564453125, -8.8623046875, -7.946044921875, -7.02978515625, -6.113525390625, -5.197265625, -4.281005859375, -3.36474609375, -2.448486328125, -1.5322265625, -0.615966796875, 0.30029296875, 1.216552734375, 2.1328125, 3.049072265625, 3.96533203125, 4.881591796875, 5.7978515625, 6.714111328125, 7.63037109375, 8.546630859375, 9.462890625, 10.379150390625, 11.29541015625, 12.211669921875, 13.1279296875, 14.044189453125, 14.96044921875, 15.876708984375, 16.79296875, 17.709228515625, 18.62548828125, 19.541748046875, 20.4580078125, 21.374267578125, 22.29052734375, 23.206787109375, 24.123046875, 25.039306640625, 25.95556640625, 26.871826171875, 27.7880859375, 28.704345703125, 29.62060546875, 30.536865234375, 31.453125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 5.0, 4.0, 3.0, 13.0, 12.0, 22.0, 16.0, 30.0, 27.0, 49.0, 27.0, 48.0, 45.0, 53.0, 57.0, 69.0, 60.0, 54.0, 58.0, 40.0, 41.0, 44.0, 35.0, 34.0, 30.0, 26.0, 21.0, 13.0, 14.0, 9.0, 12.0, 5.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.4453125, -6.26812744140625, -6.0909423828125, -5.91375732421875, -5.736572265625, -5.55938720703125, -5.3822021484375, -5.20501708984375, -5.02783203125, -4.85064697265625, -4.6734619140625, -4.49627685546875, -4.319091796875, -4.14190673828125, -3.9647216796875, -3.78753662109375, -3.6103515625, -3.43316650390625, -3.2559814453125, -3.07879638671875, -2.901611328125, -2.72442626953125, -2.5472412109375, -2.37005615234375, -2.19287109375, -2.01568603515625, -1.8385009765625, -1.66131591796875, -1.484130859375, -1.30694580078125, -1.1297607421875, -0.95257568359375, -0.775390625, -0.59820556640625, -0.4210205078125, -0.24383544921875, -0.066650390625, 0.11053466796875, 0.2877197265625, 0.46490478515625, 0.64208984375, 0.81927490234375, 0.9964599609375, 1.17364501953125, 1.350830078125, 1.52801513671875, 1.7052001953125, 1.88238525390625, 2.0595703125, 2.23675537109375, 2.4139404296875, 2.59112548828125, 2.768310546875, 2.94549560546875, 3.1226806640625, 3.29986572265625, 3.47705078125, 3.65423583984375, 3.8314208984375, 4.00860595703125, 4.185791015625, 4.36297607421875, 4.5401611328125, 4.71734619140625, 4.89453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 13.0, 16.0, 18.0, 22.0, 49.0, 48.0, 73.0, 87.0, 135.0, 174.0, 232.0, 339.0, 476.0, 742.0, 1121.0, 1824.0, 3351.0, 6936.0, 20008.0, 106971.0, 3938167.0, 82046.0, 17133.0, 6257.0, 3034.0, 1644.0, 1018.0, 716.0, 486.0, 314.0, 241.0, 159.0, 119.0, 86.0, 62.0, 51.0, 39.0, 20.0, 13.0, 13.0, 7.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -16.970458984375, -16.39404296875, -15.817626953125, -15.2412109375, -14.664794921875, -14.08837890625, -13.511962890625, -12.935546875, -12.359130859375, -11.78271484375, -11.206298828125, -10.6298828125, -10.053466796875, -9.47705078125, -8.900634765625, -8.32421875, -7.747802734375, -7.17138671875, -6.594970703125, -6.0185546875, -5.442138671875, -4.86572265625, -4.289306640625, -3.712890625, -3.136474609375, -2.56005859375, -1.983642578125, -1.4072265625, -0.830810546875, -0.25439453125, 0.322021484375, 0.8984375, 1.474853515625, 2.05126953125, 2.627685546875, 3.2041015625, 3.780517578125, 4.35693359375, 4.933349609375, 5.509765625, 6.086181640625, 6.66259765625, 7.239013671875, 7.8154296875, 8.391845703125, 8.96826171875, 9.544677734375, 10.12109375, 10.697509765625, 11.27392578125, 11.850341796875, 12.4267578125, 13.003173828125, 13.57958984375, 14.156005859375, 14.732421875, 15.308837890625, 15.88525390625, 16.461669921875, 17.0380859375, 17.614501953125, 18.19091796875, 18.767333984375, 19.34375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 8.0, 7.0, 16.0, 19.0, 35.0, 79.0, 253.0, 3338.0, 169.0, 69.0, 28.0, 23.0, 9.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76171875, -5.578125, -5.39453125, -5.2109375, -5.02734375, -4.84375, -4.66015625, -4.4765625, -4.29296875, -4.109375, -3.92578125, -3.7421875, -3.55859375, -3.375, -3.19140625, -3.0078125, -2.82421875, -2.640625, -2.45703125, -2.2734375, -2.08984375, -1.90625, -1.72265625, -1.5390625, -1.35546875, -1.171875, -0.98828125, -0.8046875, -0.62109375, -0.4375, -0.25390625, -0.0703125, 0.11328125, 0.296875, 0.48046875, 0.6640625, 0.84765625, 1.03125, 1.21484375, 1.3984375, 1.58203125, 1.765625, 1.94921875, 2.1328125, 2.31640625, 2.5, 2.68359375, 2.8671875, 3.05078125, 3.234375, 3.41796875, 3.6015625, 3.78515625, 3.96875, 4.15234375, 4.3359375, 4.51953125, 4.703125, 4.88671875, 5.0703125, 5.25390625, 5.4375, 5.62109375, 5.8046875, 5.98828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 10.0, 35.0, 78.0, 192.0, 302.0, 229.0, 112.0, 23.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.132436752319336, -24.480453491210938, -22.828472137451172, -21.176488876342773, -19.524505615234375, -17.872522354125977, -16.220539093017578, -14.568557739257812, -12.916574478149414, -11.264591217041016, -9.612608909606934, -7.960626125335693, -6.308643341064453, -4.656660079956055, -3.0046777725219727, -1.3526954650878906, 0.2992877960205078, 1.951270580291748, 3.6032533645629883, 5.2552361488342285, 6.907218933105469, 8.559202194213867, 10.21118450164795, 11.863166809082031, 13.51515007019043, 15.167133331298828, 16.819114685058594, 18.471097946166992, 20.12308120727539, 21.77506446838379, 23.427047729492188, 25.079029083251953, 26.73101043701172, 28.382993698120117, 30.034976959228516, 31.68695831298828, 33.33894348144531, 34.99092483520508, 36.642906188964844, 38.294891357421875, 39.94687271118164, 41.598854064941406, 43.25083923339844, 44.9028205871582, 46.55480194091797, 48.206787109375, 49.858768463134766, 51.51074981689453, 53.16273498535156, 54.81471633911133, 56.46670150756836, 58.118682861328125, 59.770668029785156, 61.42264938354492, 63.07463073730469, 64.72661590576172, 66.37860107421875, 68.03058624267578, 69.68256378173828, 71.33454895019531, 72.98653411865234, 74.63851928710938, 76.29049682617188, 77.9424819946289, 79.5944595336914]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 11.0, 16.0, 14.0, 12.0, 23.0, 9.0, 14.0, 16.0, 23.0, 21.0, 24.0, 22.0, 29.0, 36.0, 37.0, 45.0, 41.0, 42.0, 44.0, 38.0, 33.0, 55.0, 39.0, 35.0, 27.0, 29.0, 38.0, 32.0, 20.0, 21.0, 26.0, 14.0, 25.0, 25.0, 15.0, 12.0, 13.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.527572631835938, -11.191959381103516, -10.856346130371094, -10.520732879638672, -10.18511962890625, -9.849506378173828, -9.513893127441406, -9.178279876708984, -8.842666625976562, -8.50705337524414, -8.171440124511719, -7.835826873779297, -7.500213623046875, -7.164600372314453, -6.828987121582031, -6.493373870849609, -6.157760143280029, -5.822146892547607, -5.4865336418151855, -5.150920391082764, -4.815307140350342, -4.47969388961792, -4.14408016204834, -3.808467149734497, -3.472853899002075, -3.1372406482696533, -2.8016273975372314, -2.4660139083862305, -2.1304006576538086, -1.7947875261306763, -1.4591741561889648, -1.123560905456543, -0.7879476547241211, -0.45233437418937683, -0.11672109365463257, 0.21889221668243408, 0.554505467414856, 0.8901187181472778, 1.2257320880889893, 1.5613453388214111, 1.896958589553833, 2.232571840286255, 2.5681850910186768, 2.9037985801696777, 3.2394118309020996, 3.5750250816345215, 3.9106383323669434, 4.246251583099365, 4.581864833831787, 4.917478084564209, 5.253091335296631, 5.588704586029053, 5.924317836761475, 6.2599310874938965, 6.595544815063477, 6.931158065795898, 7.26677131652832, 7.602384567260742, 7.937997817993164, 8.273611068725586, 8.609224319458008, 8.94483757019043, 9.280450820922852, 9.616064071655273, 9.951677322387695]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 7.0, 4.0, 17.0, 21.0, 41.0, 47.0, 81.0, 160.0, 251.0, 461.0, 1019.0, 2788.0, 8815.0, 33563.0, 142130.0, 447799.0, 307244.0, 76930.0, 18460.0, 5159.0, 1854.0, 809.0, 357.0, 196.0, 108.0, 66.0, 41.0, 38.0, 31.0, 22.0, 5.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.6474609375, -14.138671875, -13.6298828125, -13.12109375, -12.6123046875, -12.103515625, -11.5947265625, -11.0859375, -10.5771484375, -10.068359375, -9.5595703125, -9.05078125, -8.5419921875, -8.033203125, -7.5244140625, -7.015625, -6.5068359375, -5.998046875, -5.4892578125, -4.98046875, -4.4716796875, -3.962890625, -3.4541015625, -2.9453125, -2.4365234375, -1.927734375, -1.4189453125, -0.91015625, -0.4013671875, 0.107421875, 0.6162109375, 1.125, 1.6337890625, 2.142578125, 2.6513671875, 3.16015625, 3.6689453125, 4.177734375, 4.6865234375, 5.1953125, 5.7041015625, 6.212890625, 6.7216796875, 7.23046875, 7.7392578125, 8.248046875, 8.7568359375, 9.265625, 9.7744140625, 10.283203125, 10.7919921875, 11.30078125, 11.8095703125, 12.318359375, 12.8271484375, 13.3359375, 13.8447265625, 14.353515625, 14.8623046875, 15.37109375, 15.8798828125, 16.388671875, 16.8974609375, 17.40625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 8.0, 7.0, 3.0, 7.0, 13.0, 6.0, 19.0, 19.0, 33.0, 37.0, 30.0, 42.0, 33.0, 45.0, 61.0, 47.0, 55.0, 59.0, 57.0, 48.0, 45.0, 37.0, 45.0, 43.0, 33.0, 23.0, 33.0, 18.0, 22.0, 15.0, 16.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-6.5546875, -6.37615966796875, -6.1976318359375, -6.01910400390625, -5.840576171875, -5.66204833984375, -5.4835205078125, -5.30499267578125, -5.12646484375, -4.94793701171875, -4.7694091796875, -4.59088134765625, -4.412353515625, -4.23382568359375, -4.0552978515625, -3.87677001953125, -3.6982421875, -3.51971435546875, -3.3411865234375, -3.16265869140625, -2.984130859375, -2.80560302734375, -2.6270751953125, -2.44854736328125, -2.27001953125, -2.09149169921875, -1.9129638671875, -1.73443603515625, -1.555908203125, -1.37738037109375, -1.1988525390625, -1.02032470703125, -0.841796875, -0.66326904296875, -0.4847412109375, -0.30621337890625, -0.127685546875, 0.05084228515625, 0.2293701171875, 0.40789794921875, 0.58642578125, 0.76495361328125, 0.9434814453125, 1.12200927734375, 1.300537109375, 1.47906494140625, 1.6575927734375, 1.83612060546875, 2.0146484375, 2.19317626953125, 2.3717041015625, 2.55023193359375, 2.728759765625, 2.90728759765625, 3.0858154296875, 3.26434326171875, 3.44287109375, 3.62139892578125, 3.7999267578125, 3.97845458984375, 4.156982421875, 4.33551025390625, 4.5140380859375, 4.69256591796875, 4.87109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 6.0, 10.0, 16.0, 17.0, 19.0, 42.0, 52.0, 79.0, 117.0, 161.0, 216.0, 286.0, 452.0, 664.0, 1201.0, 2790.0, 13694.0, 189636.0, 769256.0, 58729.0, 6528.0, 1866.0, 899.0, 590.0, 357.0, 252.0, 162.0, 143.0, 89.0, 69.0, 43.0, 38.0, 25.0, 11.0, 17.0, 10.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.125, -21.25048828125, -20.3759765625, -19.50146484375, -18.626953125, -17.75244140625, -16.8779296875, -16.00341796875, -15.12890625, -14.25439453125, -13.3798828125, -12.50537109375, -11.630859375, -10.75634765625, -9.8818359375, -9.00732421875, -8.1328125, -7.25830078125, -6.3837890625, -5.50927734375, -4.634765625, -3.76025390625, -2.8857421875, -2.01123046875, -1.13671875, -0.26220703125, 0.6123046875, 1.48681640625, 2.361328125, 3.23583984375, 4.1103515625, 4.98486328125, 5.859375, 6.73388671875, 7.6083984375, 8.48291015625, 9.357421875, 10.23193359375, 11.1064453125, 11.98095703125, 12.85546875, 13.72998046875, 14.6044921875, 15.47900390625, 16.353515625, 17.22802734375, 18.1025390625, 18.97705078125, 19.8515625, 20.72607421875, 21.6005859375, 22.47509765625, 23.349609375, 24.22412109375, 25.0986328125, 25.97314453125, 26.84765625, 27.72216796875, 28.5966796875, 29.47119140625, 30.345703125, 31.22021484375, 32.0947265625, 32.96923828125, 33.84375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 9.0, 17.0, 14.0, 22.0, 23.0, 16.0, 28.0, 29.0, 36.0, 38.0, 44.0, 43.0, 64.0, 40.0, 46.0, 42.0, 51.0, 52.0, 44.0, 38.0, 43.0, 38.0, 25.0, 30.0, 27.0, 22.0, 14.0, 17.0, 16.0, 13.0, 8.0, 6.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-23.515625, -22.7724609375, -22.029296875, -21.2861328125, -20.54296875, -19.7998046875, -19.056640625, -18.3134765625, -17.5703125, -16.8271484375, -16.083984375, -15.3408203125, -14.59765625, -13.8544921875, -13.111328125, -12.3681640625, -11.625, -10.8818359375, -10.138671875, -9.3955078125, -8.65234375, -7.9091796875, -7.166015625, -6.4228515625, -5.6796875, -4.9365234375, -4.193359375, -3.4501953125, -2.70703125, -1.9638671875, -1.220703125, -0.4775390625, 0.265625, 1.0087890625, 1.751953125, 2.4951171875, 3.23828125, 3.9814453125, 4.724609375, 5.4677734375, 6.2109375, 6.9541015625, 7.697265625, 8.4404296875, 9.18359375, 9.9267578125, 10.669921875, 11.4130859375, 12.15625, 12.8994140625, 13.642578125, 14.3857421875, 15.12890625, 15.8720703125, 16.615234375, 17.3583984375, 18.1015625, 18.8447265625, 19.587890625, 20.3310546875, 21.07421875, 21.8173828125, 22.560546875, 23.3037109375, 24.046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 3.0, 10.0, 9.0, 7.0, 8.0, 9.0, 16.0, 16.0, 17.0, 20.0, 38.0, 56.0, 104.0, 185.0, 357.0, 803.0, 4056.0, 126993.0, 897667.0, 15387.0, 1637.0, 526.0, 209.0, 123.0, 79.0, 56.0, 38.0, 30.0, 14.0, 14.0, 16.0, 10.0, 4.0, 6.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.484375, -24.694091796875, -23.90380859375, -23.113525390625, -22.3232421875, -21.532958984375, -20.74267578125, -19.952392578125, -19.162109375, -18.371826171875, -17.58154296875, -16.791259765625, -16.0009765625, -15.210693359375, -14.42041015625, -13.630126953125, -12.83984375, -12.049560546875, -11.25927734375, -10.468994140625, -9.6787109375, -8.888427734375, -8.09814453125, -7.307861328125, -6.517578125, -5.727294921875, -4.93701171875, -4.146728515625, -3.3564453125, -2.566162109375, -1.77587890625, -0.985595703125, -0.1953125, 0.594970703125, 1.38525390625, 2.175537109375, 2.9658203125, 3.756103515625, 4.54638671875, 5.336669921875, 6.126953125, 6.917236328125, 7.70751953125, 8.497802734375, 9.2880859375, 10.078369140625, 10.86865234375, 11.658935546875, 12.44921875, 13.239501953125, 14.02978515625, 14.820068359375, 15.6103515625, 16.400634765625, 17.19091796875, 17.981201171875, 18.771484375, 19.561767578125, 20.35205078125, 21.142333984375, 21.9326171875, 22.722900390625, 23.51318359375, 24.303466796875, 25.09375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 9.0, 4.0, 3.0, 21.0, 19.0, 27.0, 24.0, 30.0, 40.0, 57.0, 71.0, 100.0, 93.0, 89.0, 75.0, 61.0, 39.0, 35.0, 31.0, 31.0, 18.0, 19.0, 13.0, 20.0, 10.0, 12.0, 1.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.0012960433959960938, -0.0012586414813995361, -0.0012212395668029785, -0.001183837652206421, -0.0011464357376098633, -0.0011090338230133057, -0.001071631908416748, -0.0010342299938201904, -0.0009968280792236328, -0.0009594261646270752, -0.0009220242500305176, -0.00088462233543396, -0.0008472204208374023, -0.0008098185062408447, -0.0007724165916442871, -0.0007350146770477295, -0.0006976127624511719, -0.0006602108478546143, -0.0006228089332580566, -0.000585407018661499, -0.0005480051040649414, -0.0005106031894683838, -0.00047320127487182617, -0.00043579936027526855, -0.00039839744567871094, -0.0003609955310821533, -0.0003235936164855957, -0.0002861917018890381, -0.00024878978729248047, -0.00021138787269592285, -0.00017398595809936523, -0.00013658404350280762, -9.918212890625e-05, -6.178021430969238e-05, -2.4378299713134766e-05, 1.3023614883422852e-05, 5.042552947998047e-05, 8.782744407653809e-05, 0.0001252293586730957, 0.00016263127326965332, 0.00020003318786621094, 0.00023743510246276855, 0.00027483701705932617, 0.0003122389316558838, 0.0003496408462524414, 0.000387042760848999, 0.00042444467544555664, 0.00046184659004211426, 0.0004992485046386719, 0.0005366504192352295, 0.0005740523338317871, 0.0006114542484283447, 0.0006488561630249023, 0.00068625807762146, 0.0007236599922180176, 0.0007610619068145752, 0.0007984638214111328, 0.0008358657360076904, 0.000873267650604248, 0.0009106695652008057, 0.0009480714797973633, 0.000985473394393921, 0.0010228753089904785, 0.0010602772235870361, 0.0010976791381835938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 3.0, 10.0, 14.0, 25.0, 36.0, 46.0, 98.0, 165.0, 297.0, 562.0, 1311.0, 4644.0, 43848.0, 851379.0, 133982.0, 8484.0, 1951.0, 804.0, 367.0, 200.0, 117.0, 76.0, 36.0, 22.0, 15.0, 12.0, 12.0, 6.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.734375, -21.125, -20.515625, -19.90625, -19.296875, -18.6875, -18.078125, -17.46875, -16.859375, -16.25, -15.640625, -15.03125, -14.421875, -13.8125, -13.203125, -12.59375, -11.984375, -11.375, -10.765625, -10.15625, -9.546875, -8.9375, -8.328125, -7.71875, -7.109375, -6.5, -5.890625, -5.28125, -4.671875, -4.0625, -3.453125, -2.84375, -2.234375, -1.625, -1.015625, -0.40625, 0.203125, 0.8125, 1.421875, 2.03125, 2.640625, 3.25, 3.859375, 4.46875, 5.078125, 5.6875, 6.296875, 6.90625, 7.515625, 8.125, 8.734375, 9.34375, 9.953125, 10.5625, 11.171875, 11.78125, 12.390625, 13.0, 13.609375, 14.21875, 14.828125, 15.4375, 16.046875, 16.65625, 17.265625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 16.0, 27.0, 34.0, 51.0, 60.0, 123.0, 158.0, 168.0, 124.0, 78.0, 47.0, 36.0, 23.0, 16.0, 11.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.59375, -13.053466796875, -12.51318359375, -11.972900390625, -11.4326171875, -10.892333984375, -10.35205078125, -9.811767578125, -9.271484375, -8.731201171875, -8.19091796875, -7.650634765625, -7.1103515625, -6.570068359375, -6.02978515625, -5.489501953125, -4.94921875, -4.408935546875, -3.86865234375, -3.328369140625, -2.7880859375, -2.247802734375, -1.70751953125, -1.167236328125, -0.626953125, -0.086669921875, 0.45361328125, 0.993896484375, 1.5341796875, 2.074462890625, 2.61474609375, 3.155029296875, 3.6953125, 4.235595703125, 4.77587890625, 5.316162109375, 5.8564453125, 6.396728515625, 6.93701171875, 7.477294921875, 8.017578125, 8.557861328125, 9.09814453125, 9.638427734375, 10.1787109375, 10.718994140625, 11.25927734375, 11.799560546875, 12.33984375, 12.880126953125, 13.42041015625, 13.960693359375, 14.5009765625, 15.041259765625, 15.58154296875, 16.121826171875, 16.662109375, 17.202392578125, 17.74267578125, 18.282958984375, 18.8232421875, 19.363525390625, 19.90380859375, 20.444091796875, 20.984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 42.0, 196.0, 406.0, 268.0, 63.0, 9.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-594.6671142578125, -580.3751831054688, -566.083251953125, -551.791259765625, -537.4993286132812, -523.2073974609375, -508.91546630859375, -494.6235046386719, -480.33154296875, -466.03961181640625, -451.7476501464844, -437.4557189941406, -423.16375732421875, -408.871826171875, -394.57989501953125, -380.2879333496094, -365.9960021972656, -351.7040710449219, -337.412109375, -323.12017822265625, -308.8282165527344, -294.5362854003906, -280.24432373046875, -265.952392578125, -251.6604461669922, -237.36849975585938, -223.07655334472656, -208.78460693359375, -194.49267578125, -180.20071411132812, -165.90878295898438, -151.61683654785156, -137.32485961914062, -123.03291320800781, -108.740966796875, -94.44902801513672, -80.1570816040039, -65.8651351928711, -51.57319641113281, -37.28125, -22.989303588867188, -8.697359085083008, 5.594585418701172, 19.88652801513672, 34.17847442626953, 48.470420837402344, 62.762359619140625, 77.05430603027344, 91.34625244140625, 105.63819885253906, 119.93014526367188, 134.22207641601562, 148.5140380859375, 162.80596923828125, 177.09791564941406, 191.38986206054688, 205.6818084716797, 219.9737548828125, 234.2657012939453, 248.55764770507812, 262.8495788574219, 277.14154052734375, 291.4334716796875, 305.72540283203125, 320.0173645019531]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 12.0, 16.0, 17.0, 12.0, 13.0, 25.0, 20.0, 31.0, 35.0, 24.0, 40.0, 44.0, 41.0, 38.0, 45.0, 41.0, 52.0, 50.0, 36.0, 48.0, 33.0, 43.0, 43.0, 32.0, 25.0, 23.0, 25.0, 21.0, 20.0, 13.0, 9.0, 8.0, 12.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.62222290039062, -95.3524169921875, -92.08261108398438, -88.81279754638672, -85.5429916381836, -82.27318572998047, -79.00337982177734, -75.73356628417969, -72.46376037597656, -69.19395446777344, -65.92414855957031, -62.65433883666992, -59.38452911376953, -56.114723205566406, -52.84491729736328, -49.57510757446289, -46.305301666259766, -43.03549575805664, -39.76568603515625, -36.495880126953125, -33.226070404052734, -29.95626449584961, -26.68645668029785, -23.416648864746094, -20.146841049194336, -16.877033233642578, -13.60722541809082, -10.337418556213379, -7.067610740661621, -3.7978038787841797, -0.5279960632324219, 2.741811752319336, 6.011619567871094, 9.281427383422852, 12.55123519897461, 15.82104206085205, 19.090850830078125, 22.36065673828125, 25.630464553833008, 28.900272369384766, 32.170082092285156, 35.43988800048828, 38.70969772338867, 41.9795036315918, 45.24931335449219, 48.51911926269531, 51.78892517089844, 55.05873489379883, 58.32854080200195, 61.59834671020508, 64.86815643310547, 68.1379623413086, 71.40776824951172, 74.67758178710938, 77.9473876953125, 81.21719360351562, 84.48699951171875, 87.75680541992188, 91.026611328125, 94.29642486572266, 97.56623077392578, 100.8360366821289, 104.10584259033203, 107.37565612792969, 110.64546203613281]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 11.0, 13.0, 16.0, 31.0, 44.0, 73.0, 123.0, 208.0, 368.0, 684.0, 1526.0, 3486.0, 9732.0, 43435.0, 3771377.0, 324038.0, 26608.0, 7176.0, 2696.0, 1208.0, 591.0, 317.0, 203.0, 104.0, 69.0, 44.0, 31.0, 13.0, 15.0, 12.0, 9.0, 2.0, 6.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.078125, -24.31494140625, -23.5517578125, -22.78857421875, -22.025390625, -21.26220703125, -20.4990234375, -19.73583984375, -18.97265625, -18.20947265625, -17.4462890625, -16.68310546875, -15.919921875, -15.15673828125, -14.3935546875, -13.63037109375, -12.8671875, -12.10400390625, -11.3408203125, -10.57763671875, -9.814453125, -9.05126953125, -8.2880859375, -7.52490234375, -6.76171875, -5.99853515625, -5.2353515625, -4.47216796875, -3.708984375, -2.94580078125, -2.1826171875, -1.41943359375, -0.65625, 0.10693359375, 0.8701171875, 1.63330078125, 2.396484375, 3.15966796875, 3.9228515625, 4.68603515625, 5.44921875, 6.21240234375, 6.9755859375, 7.73876953125, 8.501953125, 9.26513671875, 10.0283203125, 10.79150390625, 11.5546875, 12.31787109375, 13.0810546875, 13.84423828125, 14.607421875, 15.37060546875, 16.1337890625, 16.89697265625, 17.66015625, 18.42333984375, 19.1865234375, 19.94970703125, 20.712890625, 21.47607421875, 22.2392578125, 23.00244140625, 23.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 11.0, 10.0, 14.0, 18.0, 30.0, 37.0, 53.0, 50.0, 62.0, 72.0, 74.0, 82.0, 72.0, 78.0, 65.0, 53.0, 49.0, 47.0, 26.0, 17.0, 22.0, 12.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.36566162109375, -7.1180419921875, -6.87042236328125, -6.622802734375, -6.37518310546875, -6.1275634765625, -5.87994384765625, -5.63232421875, -5.38470458984375, -5.1370849609375, -4.88946533203125, -4.641845703125, -4.39422607421875, -4.1466064453125, -3.89898681640625, -3.6513671875, -3.40374755859375, -3.1561279296875, -2.90850830078125, -2.660888671875, -2.41326904296875, -2.1656494140625, -1.91802978515625, -1.67041015625, -1.42279052734375, -1.1751708984375, -0.92755126953125, -0.679931640625, -0.43231201171875, -0.1846923828125, 0.06292724609375, 0.310546875, 0.55816650390625, 0.8057861328125, 1.05340576171875, 1.301025390625, 1.54864501953125, 1.7962646484375, 2.04388427734375, 2.29150390625, 2.53912353515625, 2.7867431640625, 3.03436279296875, 3.281982421875, 3.52960205078125, 3.7772216796875, 4.02484130859375, 4.2724609375, 4.52008056640625, 4.7677001953125, 5.01531982421875, 5.262939453125, 5.51055908203125, 5.7581787109375, 6.00579833984375, 6.25341796875, 6.50103759765625, 6.7486572265625, 6.99627685546875, 7.243896484375, 7.49151611328125, 7.7391357421875, 7.98675537109375, 8.234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 11.0, 12.0, 13.0, 10.0, 33.0, 37.0, 63.0, 98.0, 124.0, 202.0, 324.0, 470.0, 725.0, 1270.0, 2251.0, 4501.0, 9980.0, 27988.0, 131674.0, 3771402.0, 187312.0, 33414.0, 11329.0, 4914.0, 2395.0, 1456.0, 829.0, 488.0, 324.0, 203.0, 113.0, 89.0, 74.0, 46.0, 28.0, 25.0, 13.0, 11.0, 13.0, 10.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.46142578125, -12.0400390625, -11.61865234375, -11.197265625, -10.77587890625, -10.3544921875, -9.93310546875, -9.51171875, -9.09033203125, -8.6689453125, -8.24755859375, -7.826171875, -7.40478515625, -6.9833984375, -6.56201171875, -6.140625, -5.71923828125, -5.2978515625, -4.87646484375, -4.455078125, -4.03369140625, -3.6123046875, -3.19091796875, -2.76953125, -2.34814453125, -1.9267578125, -1.50537109375, -1.083984375, -0.66259765625, -0.2412109375, 0.18017578125, 0.6015625, 1.02294921875, 1.4443359375, 1.86572265625, 2.287109375, 2.70849609375, 3.1298828125, 3.55126953125, 3.97265625, 4.39404296875, 4.8154296875, 5.23681640625, 5.658203125, 6.07958984375, 6.5009765625, 6.92236328125, 7.34375, 7.76513671875, 8.1865234375, 8.60791015625, 9.029296875, 9.45068359375, 9.8720703125, 10.29345703125, 10.71484375, 11.13623046875, 11.5576171875, 11.97900390625, 12.400390625, 12.82177734375, 13.2431640625, 13.66455078125, 14.0859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 13.0, 19.0, 28.0, 33.0, 87.0, 248.0, 2590.0, 675.0, 168.0, 63.0, 52.0, 26.0, 21.0, 14.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.00390625, -6.76104736328125, -6.5181884765625, -6.27532958984375, -6.032470703125, -5.78961181640625, -5.5467529296875, -5.30389404296875, -5.06103515625, -4.81817626953125, -4.5753173828125, -4.33245849609375, -4.089599609375, -3.84674072265625, -3.6038818359375, -3.36102294921875, -3.1181640625, -2.87530517578125, -2.6324462890625, -2.38958740234375, -2.146728515625, -1.90386962890625, -1.6610107421875, -1.41815185546875, -1.17529296875, -0.93243408203125, -0.6895751953125, -0.44671630859375, -0.203857421875, 0.03900146484375, 0.2818603515625, 0.52471923828125, 0.767578125, 1.01043701171875, 1.2532958984375, 1.49615478515625, 1.739013671875, 1.98187255859375, 2.2247314453125, 2.46759033203125, 2.71044921875, 2.95330810546875, 3.1961669921875, 3.43902587890625, 3.681884765625, 3.92474365234375, 4.1676025390625, 4.41046142578125, 4.6533203125, 4.89617919921875, 5.1390380859375, 5.38189697265625, 5.624755859375, 5.86761474609375, 6.1104736328125, 6.35333251953125, 6.59619140625, 6.83905029296875, 7.0819091796875, 7.32476806640625, 7.567626953125, 7.81048583984375, 8.0533447265625, 8.29620361328125, 8.5390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 7.0, 4.0, 5.0, 13.0, 23.0, 37.0, 68.0, 82.0, 101.0, 127.0, 153.0, 100.0, 101.0, 59.0, 39.0, 30.0, 21.0, 14.0, 6.0, 9.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.00275421142578, -17.037540435791016, -16.07232666015625, -15.1071138381958, -14.141900062561035, -13.17668628692627, -12.21147346496582, -11.246259689331055, -10.281045913696289, -9.315832138061523, -8.350618362426758, -7.385405540466309, -6.420191764831543, -5.454977989196777, -4.48976469039917, -3.5245513916015625, -2.559337615966797, -1.5941240787506104, -0.6289105415344238, 0.3363029956817627, 1.3015165328979492, 2.266730308532715, 3.2319436073303223, 4.19715690612793, 5.162370681762695, 6.127584457397461, 7.092797756195068, 8.058011054992676, 9.023224830627441, 9.988438606262207, 10.953651428222656, 11.918865203857422, 12.884078979492188, 13.849292755126953, 14.814506530761719, 15.779719352722168, 16.74493408203125, 17.710147857666016, 18.67535972595215, 19.640573501586914, 20.60578727722168, 21.571001052856445, 22.53621482849121, 23.501428604125977, 24.46664047241211, 25.431854248046875, 26.39706802368164, 27.362281799316406, 28.327495574951172, 29.292709350585938, 30.257923126220703, 31.22313690185547, 32.188350677490234, 33.153564453125, 34.118778228759766, 35.08399200439453, 36.04920196533203, 37.0144157409668, 37.97962951660156, 38.94484329223633, 39.910057067871094, 40.87527084350586, 41.840484619140625, 42.805694580078125, 43.770912170410156]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 2.0, 5.0, 9.0, 4.0, 9.0, 13.0, 23.0, 18.0, 24.0, 15.0, 33.0, 25.0, 33.0, 30.0, 37.0, 32.0, 30.0, 25.0, 40.0, 53.0, 56.0, 50.0, 42.0, 41.0, 48.0, 35.0, 29.0, 21.0, 24.0, 24.0, 24.0, 27.0, 21.0, 23.0, 13.0, 17.0, 10.0, 7.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.932306289672852, -12.515914916992188, -12.099523544311523, -11.68313217163086, -11.266739845275879, -10.850348472595215, -10.43395709991455, -10.017565727233887, -9.601173400878906, -9.184782028198242, -8.768390655517578, -8.351999282836914, -7.935606956481934, -7.5192155838012695, -7.1028242111206055, -6.686432838439941, -6.270041465759277, -5.853650093078613, -5.437258243560791, -5.020866870880127, -4.604475021362305, -4.188083648681641, -3.7716922760009766, -3.3553006649017334, -2.9389090538024902, -2.522517442703247, -2.106125831604004, -1.6897344589233398, -1.2733428478240967, -0.8569512367248535, -0.44055986404418945, -0.02416825294494629, 0.3922233581542969, 0.8086149096488953, 1.2250064611434937, 1.6413979530334473, 2.0577895641326904, 2.4741811752319336, 2.8905725479125977, 3.306964159011841, 3.723355770111084, 4.139747142791748, 4.55613899230957, 4.972530364990234, 5.388921737670898, 5.805313587188721, 6.221704959869385, 6.638096809387207, 7.054488182067871, 7.470879554748535, 7.887271404266357, 8.30366325378418, 8.720054626464844, 9.136445999145508, 9.552837371826172, 9.969228744506836, 10.3856201171875, 10.802011489868164, 11.218402862548828, 11.634794235229492, 12.051186561584473, 12.467577934265137, 12.8839693069458, 13.300360679626465, 13.716753005981445]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 10.0, 11.0, 15.0, 18.0, 20.0, 51.0, 90.0, 121.0, 244.0, 411.0, 792.0, 1816.0, 4240.0, 11600.0, 37067.0, 129310.0, 406521.0, 319418.0, 94755.0, 27179.0, 8660.0, 3298.0, 1367.0, 682.0, 372.0, 192.0, 104.0, 73.0, 42.0, 30.0, 13.0, 7.0, 11.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4140625, -14.8404541015625, -14.266845703125, -13.6932373046875, -13.11962890625, -12.5460205078125, -11.972412109375, -11.3988037109375, -10.8251953125, -10.2515869140625, -9.677978515625, -9.1043701171875, -8.53076171875, -7.9571533203125, -7.383544921875, -6.8099365234375, -6.236328125, -5.6627197265625, -5.089111328125, -4.5155029296875, -3.94189453125, -3.3682861328125, -2.794677734375, -2.2210693359375, -1.6474609375, -1.0738525390625, -0.500244140625, 0.0733642578125, 0.64697265625, 1.2205810546875, 1.794189453125, 2.3677978515625, 2.94140625, 3.5150146484375, 4.088623046875, 4.6622314453125, 5.23583984375, 5.8094482421875, 6.383056640625, 6.9566650390625, 7.5302734375, 8.1038818359375, 8.677490234375, 9.2510986328125, 9.82470703125, 10.3983154296875, 10.971923828125, 11.5455322265625, 12.119140625, 12.6927490234375, 13.266357421875, 13.8399658203125, 14.41357421875, 14.9871826171875, 15.560791015625, 16.1343994140625, 16.7080078125, 17.2816162109375, 17.855224609375, 18.4288330078125, 19.00244140625, 19.5760498046875, 20.149658203125, 20.7232666015625, 21.296875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 2.0, 8.0, 10.0, 6.0, 17.0, 33.0, 34.0, 51.0, 47.0, 51.0, 82.0, 75.0, 80.0, 71.0, 76.0, 73.0, 59.0, 47.0, 43.0, 31.0, 31.0, 20.0, 16.0, 9.0, 10.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.9854736328125, -7.728759765625, -7.4720458984375, -7.21533203125, -6.9586181640625, -6.701904296875, -6.4451904296875, -6.1884765625, -5.9317626953125, -5.675048828125, -5.4183349609375, -5.16162109375, -4.9049072265625, -4.648193359375, -4.3914794921875, -4.134765625, -3.8780517578125, -3.621337890625, -3.3646240234375, -3.10791015625, -2.8511962890625, -2.594482421875, -2.3377685546875, -2.0810546875, -1.8243408203125, -1.567626953125, -1.3109130859375, -1.05419921875, -0.7974853515625, -0.540771484375, -0.2840576171875, -0.02734375, 0.2293701171875, 0.486083984375, 0.7427978515625, 0.99951171875, 1.2562255859375, 1.512939453125, 1.7696533203125, 2.0263671875, 2.2830810546875, 2.539794921875, 2.7965087890625, 3.05322265625, 3.3099365234375, 3.566650390625, 3.8233642578125, 4.080078125, 4.3367919921875, 4.593505859375, 4.8502197265625, 5.10693359375, 5.3636474609375, 5.620361328125, 5.8770751953125, 6.1337890625, 6.3905029296875, 6.647216796875, 6.9039306640625, 7.16064453125, 7.4173583984375, 7.674072265625, 7.9307861328125, 8.1875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 18.0, 11.0, 28.0, 41.0, 69.0, 89.0, 137.0, 285.0, 615.0, 1597.0, 7916.0, 354026.0, 669276.0, 11116.0, 1836.0, 685.0, 337.0, 200.0, 92.0, 67.0, 22.0, 26.0, 17.0, 14.0, 7.0, 6.0, 3.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.25, -65.57177734375, -63.8935546875, -62.21533203125, -60.537109375, -58.85888671875, -57.1806640625, -55.50244140625, -53.82421875, -52.14599609375, -50.4677734375, -48.78955078125, -47.111328125, -45.43310546875, -43.7548828125, -42.07666015625, -40.3984375, -38.72021484375, -37.0419921875, -35.36376953125, -33.685546875, -32.00732421875, -30.3291015625, -28.65087890625, -26.97265625, -25.29443359375, -23.6162109375, -21.93798828125, -20.259765625, -18.58154296875, -16.9033203125, -15.22509765625, -13.546875, -11.86865234375, -10.1904296875, -8.51220703125, -6.833984375, -5.15576171875, -3.4775390625, -1.79931640625, -0.12109375, 1.55712890625, 3.2353515625, 4.91357421875, 6.591796875, 8.27001953125, 9.9482421875, 11.62646484375, 13.3046875, 14.98291015625, 16.6611328125, 18.33935546875, 20.017578125, 21.69580078125, 23.3740234375, 25.05224609375, 26.73046875, 28.40869140625, 30.0869140625, 31.76513671875, 33.443359375, 35.12158203125, 36.7998046875, 38.47802734375, 40.15625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 9.0, 10.0, 7.0, 10.0, 11.0, 15.0, 18.0, 27.0, 22.0, 45.0, 40.0, 52.0, 46.0, 58.0, 61.0, 59.0, 45.0, 62.0, 46.0, 64.0, 44.0, 47.0, 31.0, 38.0, 32.0, 18.0, 20.0, 10.0, 13.0, 8.0, 11.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.390625, -24.551513671875, -23.71240234375, -22.873291015625, -22.0341796875, -21.195068359375, -20.35595703125, -19.516845703125, -18.677734375, -17.838623046875, -16.99951171875, -16.160400390625, -15.3212890625, -14.482177734375, -13.64306640625, -12.803955078125, -11.96484375, -11.125732421875, -10.28662109375, -9.447509765625, -8.6083984375, -7.769287109375, -6.93017578125, -6.091064453125, -5.251953125, -4.412841796875, -3.57373046875, -2.734619140625, -1.8955078125, -1.056396484375, -0.21728515625, 0.621826171875, 1.4609375, 2.300048828125, 3.13916015625, 3.978271484375, 4.8173828125, 5.656494140625, 6.49560546875, 7.334716796875, 8.173828125, 9.012939453125, 9.85205078125, 10.691162109375, 11.5302734375, 12.369384765625, 13.20849609375, 14.047607421875, 14.88671875, 15.725830078125, 16.56494140625, 17.404052734375, 18.2431640625, 19.082275390625, 19.92138671875, 20.760498046875, 21.599609375, 22.438720703125, 23.27783203125, 24.116943359375, 24.9560546875, 25.795166015625, 26.63427734375, 27.473388671875, 28.3125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 9.0, 17.0, 24.0, 55.0, 95.0, 227.0, 520.0, 1627.0, 8040.0, 118375.0, 861153.0, 51678.0, 4831.0, 1169.0, 385.0, 171.0, 75.0, 42.0, 29.0, 15.0, 14.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.625, -9.128173828125, -8.63134765625, -8.134521484375, -7.6376953125, -7.140869140625, -6.64404296875, -6.147216796875, -5.650390625, -5.153564453125, -4.65673828125, -4.159912109375, -3.6630859375, -3.166259765625, -2.66943359375, -2.172607421875, -1.67578125, -1.178955078125, -0.68212890625, -0.185302734375, 0.3115234375, 0.808349609375, 1.30517578125, 1.802001953125, 2.298828125, 2.795654296875, 3.29248046875, 3.789306640625, 4.2861328125, 4.782958984375, 5.27978515625, 5.776611328125, 6.2734375, 6.770263671875, 7.26708984375, 7.763916015625, 8.2607421875, 8.757568359375, 9.25439453125, 9.751220703125, 10.248046875, 10.744873046875, 11.24169921875, 11.738525390625, 12.2353515625, 12.732177734375, 13.22900390625, 13.725830078125, 14.22265625, 14.719482421875, 15.21630859375, 15.713134765625, 16.2099609375, 16.706787109375, 17.20361328125, 17.700439453125, 18.197265625, 18.694091796875, 19.19091796875, 19.687744140625, 20.1845703125, 20.681396484375, 21.17822265625, 21.675048828125, 22.171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 22.0, 25.0, 30.0, 65.0, 92.0, 168.0, 220.0, 142.0, 96.0, 50.0, 29.0, 17.0, 14.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002590179443359375, -0.0024915337562561035, -0.002392888069152832, -0.0022942423820495605, -0.002195596694946289, -0.0020969510078430176, -0.001998305320739746, -0.0018996596336364746, -0.0018010139465332031, -0.0017023682594299316, -0.0016037225723266602, -0.0015050768852233887, -0.0014064311981201172, -0.0013077855110168457, -0.0012091398239135742, -0.0011104941368103027, -0.0010118484497070312, -0.0009132027626037598, -0.0008145570755004883, -0.0007159113883972168, -0.0006172657012939453, -0.0005186200141906738, -0.00041997432708740234, -0.00032132863998413086, -0.00022268295288085938, -0.0001240372657775879, -2.5391578674316406e-05, 7.325410842895508e-05, 0.00017189979553222656, 0.00027054548263549805, 0.00036919116973876953, 0.000467836856842041, 0.0005664825439453125, 0.000665128231048584, 0.0007637739181518555, 0.000862419605255127, 0.0009610652923583984, 0.00105971097946167, 0.0011583566665649414, 0.0012570023536682129, 0.0013556480407714844, 0.0014542937278747559, 0.0015529394149780273, 0.0016515851020812988, 0.0017502307891845703, 0.0018488764762878418, 0.0019475221633911133, 0.0020461678504943848, 0.0021448135375976562, 0.0022434592247009277, 0.0023421049118041992, 0.0024407505989074707, 0.002539396286010742, 0.0026380419731140137, 0.002736687660217285, 0.0028353333473205566, 0.002933979034423828, 0.0030326247215270996, 0.003131270408630371, 0.0032299160957336426, 0.003328561782836914, 0.0034272074699401855, 0.003525853157043457, 0.0036244988441467285, 0.00372314453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 0.0, 2.0, 6.0, 13.0, 16.0, 9.0, 23.0, 42.0, 50.0, 90.0, 118.0, 227.0, 410.0, 876.0, 2545.0, 12340.0, 151381.0, 808073.0, 61994.0, 6967.0, 1810.0, 711.0, 326.0, 176.0, 102.0, 70.0, 59.0, 39.0, 20.0, 12.0, 10.0, 7.0, 8.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.625, -12.1796875, -11.734375, -11.2890625, -10.84375, -10.3984375, -9.953125, -9.5078125, -9.0625, -8.6171875, -8.171875, -7.7265625, -7.28125, -6.8359375, -6.390625, -5.9453125, -5.5, -5.0546875, -4.609375, -4.1640625, -3.71875, -3.2734375, -2.828125, -2.3828125, -1.9375, -1.4921875, -1.046875, -0.6015625, -0.15625, 0.2890625, 0.734375, 1.1796875, 1.625, 2.0703125, 2.515625, 2.9609375, 3.40625, 3.8515625, 4.296875, 4.7421875, 5.1875, 5.6328125, 6.078125, 6.5234375, 6.96875, 7.4140625, 7.859375, 8.3046875, 8.75, 9.1953125, 9.640625, 10.0859375, 10.53125, 10.9765625, 11.421875, 11.8671875, 12.3125, 12.7578125, 13.203125, 13.6484375, 14.09375, 14.5390625, 14.984375, 15.4296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 4.0, 3.0, 4.0, 7.0, 14.0, 12.0, 11.0, 17.0, 27.0, 21.0, 37.0, 41.0, 42.0, 67.0, 96.0, 90.0, 103.0, 80.0, 73.0, 49.0, 41.0, 30.0, 26.0, 24.0, 17.0, 11.0, 13.0, 5.0, 9.0, 12.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.68731689453125, -5.4410400390625, -5.19476318359375, -4.948486328125, -4.70220947265625, -4.4559326171875, -4.20965576171875, -3.96337890625, -3.71710205078125, -3.4708251953125, -3.22454833984375, -2.978271484375, -2.73199462890625, -2.4857177734375, -2.23944091796875, -1.9931640625, -1.74688720703125, -1.5006103515625, -1.25433349609375, -1.008056640625, -0.76177978515625, -0.5155029296875, -0.26922607421875, -0.02294921875, 0.22332763671875, 0.4696044921875, 0.71588134765625, 0.962158203125, 1.20843505859375, 1.4547119140625, 1.70098876953125, 1.947265625, 2.19354248046875, 2.4398193359375, 2.68609619140625, 2.932373046875, 3.17864990234375, 3.4249267578125, 3.67120361328125, 3.91748046875, 4.16375732421875, 4.4100341796875, 4.65631103515625, 4.902587890625, 5.14886474609375, 5.3951416015625, 5.64141845703125, 5.8876953125, 6.13397216796875, 6.3802490234375, 6.62652587890625, 6.872802734375, 7.11907958984375, 7.3653564453125, 7.61163330078125, 7.85791015625, 8.10418701171875, 8.3504638671875, 8.59674072265625, 8.843017578125, 9.08929443359375, 9.3355712890625, 9.58184814453125, 9.828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 12.0, 16.0, 36.0, 60.0, 111.0, 159.0, 161.0, 157.0, 129.0, 74.0, 28.0, 20.0, 17.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.7603759765625, -159.92202758789062, -154.08367919921875, -148.24534606933594, -142.40699768066406, -136.5686492919922, -130.7303009033203, -124.89196014404297, -119.05361938476562, -113.21527099609375, -107.3769302368164, -101.53858184814453, -95.70024108886719, -89.86189270019531, -84.02354431152344, -78.1852035522461, -72.34685516357422, -66.50850677490234, -60.670166015625, -54.831817626953125, -48.99347686767578, -43.155128479003906, -37.3167839050293, -31.478439331054688, -25.640094757080078, -19.80175018310547, -13.963404655456543, -8.125059127807617, -2.286714553833008, 3.5516300201416016, 9.389976501464844, 15.228321075439453, 21.066665649414062, 26.905010223388672, 32.74335479736328, 38.581703186035156, 44.4200439453125, 50.258392333984375, 56.096736907958984, 61.935081481933594, 67.77342224121094, 73.61177062988281, 79.45011138916016, 85.28845977783203, 91.12680053710938, 96.96514892578125, 102.80349731445312, 108.64183807373047, 114.48018646240234, 120.31853485107422, 126.15687561035156, 131.99522399902344, 137.8335723876953, 143.67190551757812, 149.51025390625, 155.34860229492188, 161.18695068359375, 167.02529907226562, 172.8636474609375, 178.7019805908203, 184.5403289794922, 190.37867736816406, 196.21702575683594, 202.05535888671875, 207.89370727539062]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 7.0, 13.0, 8.0, 17.0, 18.0, 14.0, 14.0, 15.0, 36.0, 23.0, 31.0, 33.0, 42.0, 27.0, 37.0, 61.0, 44.0, 48.0, 59.0, 39.0, 48.0, 46.0, 42.0, 31.0, 36.0, 26.0, 26.0, 21.0, 21.0, 23.0, 14.0, 8.0, 8.0, 10.0, 8.0, 9.0, 9.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.928466796875, -86.89380645751953, -83.85914611816406, -80.8244857788086, -77.78982543945312, -74.75516510009766, -71.72050476074219, -68.68584442138672, -65.65118408203125, -62.61652374267578, -59.58186340332031, -56.547203063964844, -53.512542724609375, -50.477882385253906, -47.44322204589844, -44.40856170654297, -41.373905181884766, -38.3392448425293, -35.30458450317383, -32.26992416381836, -29.23526382446289, -26.200603485107422, -23.165945053100586, -20.131284713745117, -17.09662437438965, -14.06196403503418, -11.027303695678711, -7.992644309997559, -4.95798397064209, -1.923323631286621, 1.1113357543945312, 4.14599609375, 7.180656433105469, 10.215316772460938, 13.249977111816406, 16.284637451171875, 19.319297790527344, 22.353958129882812, 25.38861656188965, 28.423276901245117, 31.457937240600586, 34.49259567260742, 37.52725601196289, 40.56191635131836, 43.59657669067383, 46.6312370300293, 49.665897369384766, 52.700557708740234, 55.7352180480957, 58.76987838745117, 61.80453872680664, 64.83919525146484, 67.87385559082031, 70.90851593017578, 73.94317626953125, 76.97783660888672, 80.01249694824219, 83.04715728759766, 86.08181762695312, 89.1164779663086, 92.15113830566406, 95.18579864501953, 98.220458984375, 101.25511932373047, 104.28977966308594]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 6.0, 7.0, 9.0, 16.0, 23.0, 32.0, 41.0, 59.0, 77.0, 141.0, 210.0, 358.0, 592.0, 998.0, 1724.0, 3194.0, 6415.0, 14281.0, 36363.0, 120781.0, 807056.0, 2760203.0, 326489.0, 70209.0, 24095.0, 10104.0, 4705.0, 2523.0, 1371.0, 788.0, 488.0, 311.0, 191.0, 119.0, 86.0, 59.0, 38.0, 32.0, 20.0, 13.0, 6.0, 15.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-9.390625, -9.0806884765625, -8.770751953125, -8.4608154296875, -8.15087890625, -7.8409423828125, -7.531005859375, -7.2210693359375, -6.9111328125, -6.6011962890625, -6.291259765625, -5.9813232421875, -5.67138671875, -5.3614501953125, -5.051513671875, -4.7415771484375, -4.431640625, -4.1217041015625, -3.811767578125, -3.5018310546875, -3.19189453125, -2.8819580078125, -2.572021484375, -2.2620849609375, -1.9521484375, -1.6422119140625, -1.332275390625, -1.0223388671875, -0.71240234375, -0.4024658203125, -0.092529296875, 0.2174072265625, 0.52734375, 0.8372802734375, 1.147216796875, 1.4571533203125, 1.76708984375, 2.0770263671875, 2.386962890625, 2.6968994140625, 3.0068359375, 3.3167724609375, 3.626708984375, 3.9366455078125, 4.24658203125, 4.5565185546875, 4.866455078125, 5.1763916015625, 5.486328125, 5.7962646484375, 6.106201171875, 6.4161376953125, 6.72607421875, 7.0360107421875, 7.345947265625, 7.6558837890625, 7.9658203125, 8.2757568359375, 8.585693359375, 8.8956298828125, 9.20556640625, 9.5155029296875, 9.825439453125, 10.1353759765625, 10.4453125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 12.0, 7.0, 8.0, 10.0, 20.0, 22.0, 23.0, 27.0, 31.0, 49.0, 56.0, 44.0, 52.0, 58.0, 62.0, 62.0, 69.0, 47.0, 56.0, 42.0, 35.0, 36.0, 32.0, 24.0, 29.0, 15.0, 15.0, 8.0, 10.0, 4.0, 8.0, 9.0, 7.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.88671875, -5.6990966796875, -5.511474609375, -5.3238525390625, -5.13623046875, -4.9486083984375, -4.760986328125, -4.5733642578125, -4.3857421875, -4.1981201171875, -4.010498046875, -3.8228759765625, -3.63525390625, -3.4476318359375, -3.260009765625, -3.0723876953125, -2.884765625, -2.6971435546875, -2.509521484375, -2.3218994140625, -2.13427734375, -1.9466552734375, -1.759033203125, -1.5714111328125, -1.3837890625, -1.1961669921875, -1.008544921875, -0.8209228515625, -0.63330078125, -0.4456787109375, -0.258056640625, -0.0704345703125, 0.1171875, 0.3048095703125, 0.492431640625, 0.6800537109375, 0.86767578125, 1.0552978515625, 1.242919921875, 1.4305419921875, 1.6181640625, 1.8057861328125, 1.993408203125, 2.1810302734375, 2.36865234375, 2.5562744140625, 2.743896484375, 2.9315185546875, 3.119140625, 3.3067626953125, 3.494384765625, 3.6820068359375, 3.86962890625, 4.0572509765625, 4.244873046875, 4.4324951171875, 4.6201171875, 4.8077392578125, 4.995361328125, 5.1829833984375, 5.37060546875, 5.5582275390625, 5.745849609375, 5.9334716796875, 6.12109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 7.0, 8.0, 8.0, 15.0, 17.0, 44.0, 53.0, 90.0, 190.0, 421.0, 1279.0, 4323.0, 18795.0, 142568.0, 3637602.0, 346968.0, 32064.0, 6854.0, 1888.0, 591.0, 237.0, 99.0, 64.0, 38.0, 15.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.517578125, -17.84765625, -17.177734375, -16.5078125, -15.837890625, -15.16796875, -14.498046875, -13.828125, -13.158203125, -12.48828125, -11.818359375, -11.1484375, -10.478515625, -9.80859375, -9.138671875, -8.46875, -7.798828125, -7.12890625, -6.458984375, -5.7890625, -5.119140625, -4.44921875, -3.779296875, -3.109375, -2.439453125, -1.76953125, -1.099609375, -0.4296875, 0.240234375, 0.91015625, 1.580078125, 2.25, 2.919921875, 3.58984375, 4.259765625, 4.9296875, 5.599609375, 6.26953125, 6.939453125, 7.609375, 8.279296875, 8.94921875, 9.619140625, 10.2890625, 10.958984375, 11.62890625, 12.298828125, 12.96875, 13.638671875, 14.30859375, 14.978515625, 15.6484375, 16.318359375, 16.98828125, 17.658203125, 18.328125, 18.998046875, 19.66796875, 20.337890625, 21.0078125, 21.677734375, 22.34765625, 23.017578125, 23.6875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 5.0, 15.0, 13.0, 12.0, 27.0, 29.0, 52.0, 72.0, 123.0, 203.0, 354.0, 658.0, 875.0, 596.0, 342.0, 200.0, 141.0, 90.0, 46.0, 49.0, 29.0, 25.0, 22.0, 11.0, 13.0, 12.0, 6.0, 3.0, 9.0, 7.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.953125, -13.5479736328125, -13.142822265625, -12.7376708984375, -12.33251953125, -11.9273681640625, -11.522216796875, -11.1170654296875, -10.7119140625, -10.3067626953125, -9.901611328125, -9.4964599609375, -9.09130859375, -8.6861572265625, -8.281005859375, -7.8758544921875, -7.470703125, -7.0655517578125, -6.660400390625, -6.2552490234375, -5.85009765625, -5.4449462890625, -5.039794921875, -4.6346435546875, -4.2294921875, -3.8243408203125, -3.419189453125, -3.0140380859375, -2.60888671875, -2.2037353515625, -1.798583984375, -1.3934326171875, -0.98828125, -0.5831298828125, -0.177978515625, 0.2271728515625, 0.63232421875, 1.0374755859375, 1.442626953125, 1.8477783203125, 2.2529296875, 2.6580810546875, 3.063232421875, 3.4683837890625, 3.87353515625, 4.2786865234375, 4.683837890625, 5.0889892578125, 5.494140625, 5.8992919921875, 6.304443359375, 6.7095947265625, 7.11474609375, 7.5198974609375, 7.925048828125, 8.3302001953125, 8.7353515625, 9.1405029296875, 9.545654296875, 9.9508056640625, 10.35595703125, 10.7611083984375, 11.166259765625, 11.5714111328125, 11.9765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 23.0, 86.0, 251.0, 318.0, 187.0, 79.0, 24.0, 14.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.29956817626953, -98.4058609008789, -89.51216125488281, -80.61845397949219, -71.72474670410156, -62.83104705810547, -53.937339782714844, -45.043636322021484, -36.149932861328125, -27.256229400634766, -18.362524032592773, -9.468818664550781, -0.5751152038574219, 8.318588256835938, 17.212295532226562, 26.105998992919922, 34.99970245361328, 43.89340591430664, 52.787109375, 61.680816650390625, 70.57452392578125, 79.46822357177734, 88.36193084716797, 97.25563049316406, 106.14933776855469, 115.04304504394531, 123.9367446899414, 132.8304443359375, 141.72415161132812, 150.61785888671875, 159.51156616210938, 168.4052734375, 177.29898071289062, 186.19268798828125, 195.08639526367188, 203.9801025390625, 212.87379455566406, 221.7675018310547, 230.6612091064453, 239.55491638183594, 248.4486083984375, 257.3423156738281, 266.23602294921875, 275.1297302246094, 284.0234375, 292.9171142578125, 301.81085205078125, 310.70452880859375, 319.5982666015625, 328.4919738769531, 337.38568115234375, 346.2793884277344, 355.173095703125, 364.0667724609375, 372.96051025390625, 381.85418701171875, 390.7478942871094, 399.6416015625, 408.5353088378906, 417.42901611328125, 426.3227233886719, 435.2164306640625, 444.110107421875, 453.0038146972656, 461.89752197265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 7.0, 2.0, 9.0, 15.0, 30.0, 24.0, 29.0, 29.0, 45.0, 44.0, 43.0, 42.0, 53.0, 43.0, 65.0, 54.0, 57.0, 58.0, 48.0, 46.0, 48.0, 34.0, 36.0, 29.0, 18.0, 17.0, 16.0, 20.0, 8.0, 7.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.30931091308594, -65.72479248046875, -63.14027404785156, -60.555755615234375, -57.97124099731445, -55.386722564697266, -52.80220413208008, -50.217689514160156, -47.63317108154297, -45.04865264892578, -42.464134216308594, -39.879615783691406, -37.295101165771484, -34.7105827331543, -32.12606430053711, -29.541547775268555, -26.957027435302734, -24.372509002685547, -21.787992477416992, -19.203474044799805, -16.61895751953125, -14.034439086914062, -11.449920654296875, -8.86540412902832, -6.280885696411133, -3.6963679790496826, -1.1118502616882324, 1.4726676940917969, 4.057185173034668, 6.641702651977539, 9.226221084594727, 11.810737609863281, 14.395256042480469, 16.979774475097656, 19.56429100036621, 22.1488094329834, 24.733325958251953, 27.31784439086914, 29.902362823486328, 32.48687744140625, 35.07139587402344, 37.655914306640625, 40.24043273925781, 42.824951171875, 45.40946578979492, 47.99398422241211, 50.5785026550293, 53.16301727294922, 55.74753952026367, 58.33205795288086, 60.91657638549805, 63.50109100341797, 66.08560943603516, 68.67012786865234, 71.25464630126953, 73.83916473388672, 76.4236831665039, 79.0082015991211, 81.59272003173828, 84.17723846435547, 86.76175689697266, 89.34626770019531, 91.9307861328125, 94.51530456542969, 97.09982299804688]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 8.0, 8.0, 19.0, 25.0, 26.0, 33.0, 75.0, 129.0, 174.0, 277.0, 428.0, 704.0, 998.0, 1930.0, 3369.0, 6166.0, 12047.0, 24929.0, 52666.0, 121172.0, 296287.0, 299336.0, 123068.0, 53084.0, 24996.0, 12180.0, 6215.0, 3347.0, 1846.0, 1122.0, 701.0, 416.0, 276.0, 164.0, 114.0, 64.0, 41.0, 32.0, 33.0, 8.0, 14.0, 11.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.765625, -9.428955078125, -9.09228515625, -8.755615234375, -8.4189453125, -8.082275390625, -7.74560546875, -7.408935546875, -7.072265625, -6.735595703125, -6.39892578125, -6.062255859375, -5.7255859375, -5.388916015625, -5.05224609375, -4.715576171875, -4.37890625, -4.042236328125, -3.70556640625, -3.368896484375, -3.0322265625, -2.695556640625, -2.35888671875, -2.022216796875, -1.685546875, -1.348876953125, -1.01220703125, -0.675537109375, -0.3388671875, -0.002197265625, 0.33447265625, 0.671142578125, 1.0078125, 1.344482421875, 1.68115234375, 2.017822265625, 2.3544921875, 2.691162109375, 3.02783203125, 3.364501953125, 3.701171875, 4.037841796875, 4.37451171875, 4.711181640625, 5.0478515625, 5.384521484375, 5.72119140625, 6.057861328125, 6.39453125, 6.731201171875, 7.06787109375, 7.404541015625, 7.7412109375, 8.077880859375, 8.41455078125, 8.751220703125, 9.087890625, 9.424560546875, 9.76123046875, 10.097900390625, 10.4345703125, 10.771240234375, 11.10791015625, 11.444580078125, 11.78125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 2.0, 2.0, 14.0, 6.0, 11.0, 19.0, 17.0, 25.0, 32.0, 30.0, 31.0, 39.0, 54.0, 43.0, 46.0, 46.0, 53.0, 53.0, 37.0, 47.0, 51.0, 44.0, 31.0, 55.0, 23.0, 36.0, 22.0, 21.0, 25.0, 20.0, 10.0, 5.0, 11.0, 9.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.828125, -4.65985107421875, -4.4915771484375, -4.32330322265625, -4.155029296875, -3.98675537109375, -3.8184814453125, -3.65020751953125, -3.48193359375, -3.31365966796875, -3.1453857421875, -2.97711181640625, -2.808837890625, -2.64056396484375, -2.4722900390625, -2.30401611328125, -2.1357421875, -1.96746826171875, -1.7991943359375, -1.63092041015625, -1.462646484375, -1.29437255859375, -1.1260986328125, -0.95782470703125, -0.78955078125, -0.62127685546875, -0.4530029296875, -0.28472900390625, -0.116455078125, 0.05181884765625, 0.2200927734375, 0.38836669921875, 0.556640625, 0.72491455078125, 0.8931884765625, 1.06146240234375, 1.229736328125, 1.39801025390625, 1.5662841796875, 1.73455810546875, 1.90283203125, 2.07110595703125, 2.2393798828125, 2.40765380859375, 2.575927734375, 2.74420166015625, 2.9124755859375, 3.08074951171875, 3.2490234375, 3.41729736328125, 3.5855712890625, 3.75384521484375, 3.922119140625, 4.09039306640625, 4.2586669921875, 4.42694091796875, 4.59521484375, 4.76348876953125, 4.9317626953125, 5.10003662109375, 5.268310546875, 5.43658447265625, 5.6048583984375, 5.77313232421875, 5.94140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 9.0, 8.0, 11.0, 12.0, 28.0, 36.0, 57.0, 64.0, 108.0, 185.0, 351.0, 688.0, 1750.0, 8350.0, 168364.0, 837132.0, 25841.0, 3349.0, 1076.0, 476.0, 239.0, 165.0, 71.0, 50.0, 30.0, 31.0, 19.0, 14.0, 7.0, 5.0, 9.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-43.0625, -41.68359375, -40.3046875, -38.92578125, -37.546875, -36.16796875, -34.7890625, -33.41015625, -32.03125, -30.65234375, -29.2734375, -27.89453125, -26.515625, -25.13671875, -23.7578125, -22.37890625, -21.0, -19.62109375, -18.2421875, -16.86328125, -15.484375, -14.10546875, -12.7265625, -11.34765625, -9.96875, -8.58984375, -7.2109375, -5.83203125, -4.453125, -3.07421875, -1.6953125, -0.31640625, 1.0625, 2.44140625, 3.8203125, 5.19921875, 6.578125, 7.95703125, 9.3359375, 10.71484375, 12.09375, 13.47265625, 14.8515625, 16.23046875, 17.609375, 18.98828125, 20.3671875, 21.74609375, 23.125, 24.50390625, 25.8828125, 27.26171875, 28.640625, 30.01953125, 31.3984375, 32.77734375, 34.15625, 35.53515625, 36.9140625, 38.29296875, 39.671875, 41.05078125, 42.4296875, 43.80859375, 45.1875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 1.0, 7.0, 8.0, 11.0, 15.0, 12.0, 16.0, 18.0, 25.0, 25.0, 23.0, 39.0, 32.0, 51.0, 50.0, 63.0, 58.0, 58.0, 63.0, 71.0, 48.0, 49.0, 47.0, 38.0, 25.0, 30.0, 25.0, 20.0, 8.0, 12.0, 15.0, 8.0, 1.0, 8.0, 0.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-24.09375, -23.235107421875, -22.37646484375, -21.517822265625, -20.6591796875, -19.800537109375, -18.94189453125, -18.083251953125, -17.224609375, -16.365966796875, -15.50732421875, -14.648681640625, -13.7900390625, -12.931396484375, -12.07275390625, -11.214111328125, -10.35546875, -9.496826171875, -8.63818359375, -7.779541015625, -6.9208984375, -6.062255859375, -5.20361328125, -4.344970703125, -3.486328125, -2.627685546875, -1.76904296875, -0.910400390625, -0.0517578125, 0.806884765625, 1.66552734375, 2.524169921875, 3.3828125, 4.241455078125, 5.10009765625, 5.958740234375, 6.8173828125, 7.676025390625, 8.53466796875, 9.393310546875, 10.251953125, 11.110595703125, 11.96923828125, 12.827880859375, 13.6865234375, 14.545166015625, 15.40380859375, 16.262451171875, 17.12109375, 17.979736328125, 18.83837890625, 19.697021484375, 20.5556640625, 21.414306640625, 22.27294921875, 23.131591796875, 23.990234375, 24.848876953125, 25.70751953125, 26.566162109375, 27.4248046875, 28.283447265625, 29.14208984375, 30.000732421875, 30.859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 14.0, 14.0, 15.0, 29.0, 33.0, 45.0, 69.0, 109.0, 197.0, 387.0, 917.0, 2615.0, 13813.0, 205774.0, 780736.0, 36310.0, 4888.0, 1325.0, 535.0, 276.0, 126.0, 108.0, 54.0, 36.0, 26.0, 21.0, 21.0, 9.0, 5.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.1875, -12.7509765625, -12.314453125, -11.8779296875, -11.44140625, -11.0048828125, -10.568359375, -10.1318359375, -9.6953125, -9.2587890625, -8.822265625, -8.3857421875, -7.94921875, -7.5126953125, -7.076171875, -6.6396484375, -6.203125, -5.7666015625, -5.330078125, -4.8935546875, -4.45703125, -4.0205078125, -3.583984375, -3.1474609375, -2.7109375, -2.2744140625, -1.837890625, -1.4013671875, -0.96484375, -0.5283203125, -0.091796875, 0.3447265625, 0.78125, 1.2177734375, 1.654296875, 2.0908203125, 2.52734375, 2.9638671875, 3.400390625, 3.8369140625, 4.2734375, 4.7099609375, 5.146484375, 5.5830078125, 6.01953125, 6.4560546875, 6.892578125, 7.3291015625, 7.765625, 8.2021484375, 8.638671875, 9.0751953125, 9.51171875, 9.9482421875, 10.384765625, 10.8212890625, 11.2578125, 11.6943359375, 12.130859375, 12.5673828125, 13.00390625, 13.4404296875, 13.876953125, 14.3134765625, 14.75]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 12.0, 12.0, 15.0, 23.0, 23.0, 31.0, 55.0, 95.0, 136.0, 183.0, 125.0, 80.0, 59.0, 28.0, 35.0, 20.0, 21.0, 10.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00276947021484375, -0.0026991814374923706, -0.002628892660140991, -0.002558603882789612, -0.0024883151054382324, -0.002418026328086853, -0.0023477375507354736, -0.0022774487733840942, -0.002207159996032715, -0.0021368712186813354, -0.002066582441329956, -0.0019962936639785767, -0.0019260048866271973, -0.0018557161092758179, -0.0017854273319244385, -0.001715138554573059, -0.0016448497772216797, -0.0015745609998703003, -0.001504272222518921, -0.0014339834451675415, -0.0013636946678161621, -0.0012934058904647827, -0.0012231171131134033, -0.001152828335762024, -0.0010825395584106445, -0.0010122507810592651, -0.0009419620037078857, -0.0008716732263565063, -0.000801384449005127, -0.0007310956716537476, -0.0006608068943023682, -0.0005905181169509888, -0.0005202293395996094, -0.00044994056224823, -0.0003796517848968506, -0.0003093630075454712, -0.0002390742301940918, -0.0001687854528427124, -9.849667549133301e-05, -2.8207898139953613e-05, 4.208087921142578e-05, 0.00011236965656280518, 0.00018265843391418457, 0.00025294721126556396, 0.00032323598861694336, 0.00039352476596832275, 0.00046381354331970215, 0.0005341023206710815, 0.0006043910980224609, 0.0006746798753738403, 0.0007449686527252197, 0.0008152574300765991, 0.0008855462074279785, 0.0009558349847793579, 0.0010261237621307373, 0.0010964125394821167, 0.001166701316833496, 0.0012369900941848755, 0.0013072788715362549, 0.0013775676488876343, 0.0014478564262390137, 0.001518145203590393, 0.0015884339809417725, 0.0016587227582931519, 0.0017290115356445312]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 7.0, 8.0, 15.0, 16.0, 9.0, 22.0, 30.0, 33.0, 82.0, 107.0, 147.0, 276.0, 480.0, 1009.0, 2084.0, 6492.0, 35878.0, 579863.0, 384504.0, 28029.0, 5598.0, 1877.0, 809.0, 420.0, 261.0, 150.0, 108.0, 60.0, 39.0, 26.0, 25.0, 18.0, 14.0, 12.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.796875, -10.423828125, -10.05078125, -9.677734375, -9.3046875, -8.931640625, -8.55859375, -8.185546875, -7.8125, -7.439453125, -7.06640625, -6.693359375, -6.3203125, -5.947265625, -5.57421875, -5.201171875, -4.828125, -4.455078125, -4.08203125, -3.708984375, -3.3359375, -2.962890625, -2.58984375, -2.216796875, -1.84375, -1.470703125, -1.09765625, -0.724609375, -0.3515625, 0.021484375, 0.39453125, 0.767578125, 1.140625, 1.513671875, 1.88671875, 2.259765625, 2.6328125, 3.005859375, 3.37890625, 3.751953125, 4.125, 4.498046875, 4.87109375, 5.244140625, 5.6171875, 5.990234375, 6.36328125, 6.736328125, 7.109375, 7.482421875, 7.85546875, 8.228515625, 8.6015625, 8.974609375, 9.34765625, 9.720703125, 10.09375, 10.466796875, 10.83984375, 11.212890625, 11.5859375, 11.958984375, 12.33203125, 12.705078125, 13.078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 6.0, 7.0, 2.0, 6.0, 4.0, 5.0, 5.0, 17.0, 17.0, 23.0, 21.0, 29.0, 32.0, 42.0, 69.0, 88.0, 101.0, 105.0, 79.0, 80.0, 47.0, 46.0, 42.0, 22.0, 20.0, 21.0, 13.0, 7.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.51708984375, -8.2685546875, -8.02001953125, -7.771484375, -7.52294921875, -7.2744140625, -7.02587890625, -6.77734375, -6.52880859375, -6.2802734375, -6.03173828125, -5.783203125, -5.53466796875, -5.2861328125, -5.03759765625, -4.7890625, -4.54052734375, -4.2919921875, -4.04345703125, -3.794921875, -3.54638671875, -3.2978515625, -3.04931640625, -2.80078125, -2.55224609375, -2.3037109375, -2.05517578125, -1.806640625, -1.55810546875, -1.3095703125, -1.06103515625, -0.8125, -0.56396484375, -0.3154296875, -0.06689453125, 0.181640625, 0.43017578125, 0.6787109375, 0.92724609375, 1.17578125, 1.42431640625, 1.6728515625, 1.92138671875, 2.169921875, 2.41845703125, 2.6669921875, 2.91552734375, 3.1640625, 3.41259765625, 3.6611328125, 3.90966796875, 4.158203125, 4.40673828125, 4.6552734375, 4.90380859375, 5.15234375, 5.40087890625, 5.6494140625, 5.89794921875, 6.146484375, 6.39501953125, 6.6435546875, 6.89208984375, 7.140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 21.0, 72.0, 228.0, 357.0, 209.0, 64.0, 23.0, 7.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.30621337890625, -214.85260009765625, -204.39898681640625, -193.94537353515625, -183.49176025390625, -173.03814697265625, -162.58453369140625, -152.13092041015625, -141.67730712890625, -131.22369384765625, -120.77008056640625, -110.31646728515625, -99.86285400390625, -89.40924072265625, -78.95561981201172, -68.50200653076172, -58.04838562011719, -47.59477233886719, -37.14115905761719, -26.687541961669922, -16.233928680419922, -5.780315399169922, 4.673301696777344, 15.126914978027344, 25.580528259277344, 36.034141540527344, 46.487754821777344, 56.94137191772461, 67.39498901367188, 77.84860229492188, 88.30221557617188, 98.75582885742188, 109.20944213867188, 119.66305541992188, 130.11666870117188, 140.57028198242188, 151.02389526367188, 161.47750854492188, 171.93112182617188, 182.38473510742188, 192.83834838867188, 203.29196166992188, 213.74557495117188, 224.19918823242188, 234.65280151367188, 245.10641479492188, 255.56002807617188, 266.0136413574219, 276.46728515625, 286.9208984375, 297.37451171875, 307.828125, 318.28173828125, 328.7353515625, 339.18896484375, 349.642578125, 360.09619140625, 370.5498046875, 381.00341796875, 391.45703125, 401.91064453125, 412.3642578125, 422.81787109375, 433.271484375, 443.72509765625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 8.0, 9.0, 9.0, 10.0, 15.0, 18.0, 18.0, 11.0, 23.0, 25.0, 18.0, 36.0, 29.0, 32.0, 35.0, 41.0, 54.0, 56.0, 52.0, 54.0, 57.0, 50.0, 39.0, 37.0, 30.0, 29.0, 25.0, 32.0, 27.0, 26.0, 15.0, 17.0, 17.0, 14.0, 8.0, 13.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-100.84375, -97.78082275390625, -94.7178955078125, -91.65496826171875, -88.592041015625, -85.52912139892578, -82.46619415283203, -79.40326690673828, -76.34033966064453, -73.27741241455078, -70.21448516845703, -67.15155792236328, -64.08863830566406, -61.02570724487305, -57.96278381347656, -54.89985656738281, -51.83692932128906, -48.77400207519531, -45.71107482910156, -42.64815139770508, -39.58522415161133, -36.52229690551758, -33.459373474121094, -30.396446228027344, -27.333518981933594, -24.270591735839844, -21.207666397094727, -18.14474105834961, -15.08181381225586, -12.018887519836426, -8.955961227416992, -5.893035888671875, -2.8301162719726562, 0.23281002044677734, 3.295736312866211, 6.3586626052856445, 9.421588897705078, 12.484515190124512, 15.547441482543945, 18.610366821289062, 21.673294067382812, 24.736221313476562, 27.79914665222168, 30.862071990966797, 33.92499923706055, 36.9879264831543, 40.05084991455078, 43.11377716064453, 46.17670440673828, 49.23963165283203, 52.30255889892578, 55.365482330322266, 58.428409576416016, 61.491336822509766, 64.55426025390625, 67.6171875, 70.68011474609375, 73.7430419921875, 76.80596923828125, 79.868896484375, 82.93182373046875, 85.99474334716797, 89.05767059326172, 92.12059783935547, 95.18352508544922]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 17.0, 33.0, 47.0, 75.0, 134.0, 276.0, 1533.0, 4142497.0, 48625.0, 548.0, 206.0, 109.0, 80.0, 42.0, 12.0, 14.0, 9.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.9375, -85.73828125, -82.5390625, -79.33984375, -76.140625, -72.94140625, -69.7421875, -66.54296875, -63.34375, -60.14453125, -56.9453125, -53.74609375, -50.546875, -47.34765625, -44.1484375, -40.94921875, -37.75, -34.55078125, -31.3515625, -28.15234375, -24.953125, -21.75390625, -18.5546875, -15.35546875, -12.15625, -8.95703125, -5.7578125, -2.55859375, 0.640625, 3.83984375, 7.0390625, 10.23828125, 13.4375, 16.63671875, 19.8359375, 23.03515625, 26.234375, 29.43359375, 32.6328125, 35.83203125, 39.03125, 42.23046875, 45.4296875, 48.62890625, 51.828125, 55.02734375, 58.2265625, 61.42578125, 64.625, 67.82421875, 71.0234375, 74.22265625, 77.421875, 80.62109375, 83.8203125, 87.01953125, 90.21875, 93.41796875, 96.6171875, 99.81640625, 103.015625, 106.21484375, 109.4140625, 112.61328125, 115.8125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 14.0, 6.0, 23.0, 32.0, 27.0, 39.0, 60.0, 61.0, 71.0, 83.0, 75.0, 76.0, 73.0, 79.0, 56.0, 53.0, 40.0, 33.0, 24.0, 23.0, 14.0, 11.0, 8.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.87994384765625, -7.6348876953125, -7.38983154296875, -7.144775390625, -6.89971923828125, -6.6546630859375, -6.40960693359375, -6.16455078125, -5.91949462890625, -5.6744384765625, -5.42938232421875, -5.184326171875, -4.93927001953125, -4.6942138671875, -4.44915771484375, -4.2041015625, -3.95904541015625, -3.7139892578125, -3.46893310546875, -3.223876953125, -2.97882080078125, -2.7337646484375, -2.48870849609375, -2.24365234375, -1.99859619140625, -1.7535400390625, -1.50848388671875, -1.263427734375, -1.01837158203125, -0.7733154296875, -0.52825927734375, -0.283203125, -0.03814697265625, 0.2069091796875, 0.45196533203125, 0.697021484375, 0.94207763671875, 1.1871337890625, 1.43218994140625, 1.67724609375, 1.92230224609375, 2.1673583984375, 2.41241455078125, 2.657470703125, 2.90252685546875, 3.1475830078125, 3.39263916015625, 3.6376953125, 3.88275146484375, 4.1278076171875, 4.37286376953125, 4.617919921875, 4.86297607421875, 5.1080322265625, 5.35308837890625, 5.59814453125, 5.84320068359375, 6.0882568359375, 6.33331298828125, 6.578369140625, 6.82342529296875, 7.0684814453125, 7.31353759765625, 7.55859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 6.0, 8.0, 17.0, 17.0, 18.0, 61.0, 89.0, 187.0, 339.0, 746.0, 1488.0, 3316.0, 7818.0, 20905.0, 78085.0, 738732.0, 3063094.0, 213607.0, 41030.0, 13418.0, 5756.0, 2690.0, 1338.0, 704.0, 396.0, 184.0, 96.0, 52.0, 35.0, 21.0, 8.0, 5.0, 8.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.015625, -10.6517333984375, -10.287841796875, -9.9239501953125, -9.56005859375, -9.1961669921875, -8.832275390625, -8.4683837890625, -8.1044921875, -7.7406005859375, -7.376708984375, -7.0128173828125, -6.64892578125, -6.2850341796875, -5.921142578125, -5.5572509765625, -5.193359375, -4.8294677734375, -4.465576171875, -4.1016845703125, -3.73779296875, -3.3739013671875, -3.010009765625, -2.6461181640625, -2.2822265625, -1.9183349609375, -1.554443359375, -1.1905517578125, -0.82666015625, -0.4627685546875, -0.098876953125, 0.2650146484375, 0.62890625, 0.9927978515625, 1.356689453125, 1.7205810546875, 2.08447265625, 2.4483642578125, 2.812255859375, 3.1761474609375, 3.5400390625, 3.9039306640625, 4.267822265625, 4.6317138671875, 4.99560546875, 5.3594970703125, 5.723388671875, 6.0872802734375, 6.451171875, 6.8150634765625, 7.178955078125, 7.5428466796875, 7.90673828125, 8.2706298828125, 8.634521484375, 8.9984130859375, 9.3623046875, 9.7261962890625, 10.090087890625, 10.4539794921875, 10.81787109375, 11.1817626953125, 11.545654296875, 11.9095458984375, 12.2734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 12.0, 11.0, 15.0, 26.0, 24.0, 37.0, 72.0, 91.0, 142.0, 243.0, 469.0, 799.0, 800.0, 503.0, 292.0, 159.0, 98.0, 67.0, 42.0, 33.0, 24.0, 18.0, 18.0, 13.0, 8.0, 5.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.390625, -9.0677490234375, -8.744873046875, -8.4219970703125, -8.09912109375, -7.7762451171875, -7.453369140625, -7.1304931640625, -6.8076171875, -6.4847412109375, -6.161865234375, -5.8389892578125, -5.51611328125, -5.1932373046875, -4.870361328125, -4.5474853515625, -4.224609375, -3.9017333984375, -3.578857421875, -3.2559814453125, -2.93310546875, -2.6102294921875, -2.287353515625, -1.9644775390625, -1.6416015625, -1.3187255859375, -0.995849609375, -0.6729736328125, -0.35009765625, -0.0272216796875, 0.295654296875, 0.6185302734375, 0.94140625, 1.2642822265625, 1.587158203125, 1.9100341796875, 2.23291015625, 2.5557861328125, 2.878662109375, 3.2015380859375, 3.5244140625, 3.8472900390625, 4.170166015625, 4.4930419921875, 4.81591796875, 5.1387939453125, 5.461669921875, 5.7845458984375, 6.107421875, 6.4302978515625, 6.753173828125, 7.0760498046875, 7.39892578125, 7.7218017578125, 8.044677734375, 8.3675537109375, 8.6904296875, 9.0133056640625, 9.336181640625, 9.6590576171875, 9.98193359375, 10.3048095703125, 10.627685546875, 10.9505615234375, 11.2734375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 11.0, 14.0, 20.0, 48.0, 68.0, 133.0, 169.0, 163.0, 130.0, 96.0, 53.0, 27.0, 16.0, 17.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.15904235839844, -59.059532165527344, -55.96002197265625, -52.860511779785156, -49.76100158691406, -46.66149139404297, -43.56197738647461, -40.462467193603516, -37.36295700073242, -34.26344680786133, -31.163936614990234, -28.064424514770508, -24.964914321899414, -21.86540412902832, -18.765892028808594, -15.6663818359375, -12.566871643066406, -9.467361450195312, -6.367850303649902, -3.268339157104492, -0.16882896423339844, 2.9306812286376953, 6.030193328857422, 9.129703521728516, 12.22921371459961, 15.328723907470703, 18.428234100341797, 21.527746200561523, 24.627256393432617, 27.72676658630371, 30.826278686523438, 33.92578887939453, 37.025299072265625, 40.12480926513672, 43.22431945800781, 46.323829650878906, 49.42333984375, 52.522850036621094, 55.62236404418945, 58.72187423706055, 61.82138442993164, 64.9208984375, 68.0204086303711, 71.11991882324219, 74.21942901611328, 77.31893920898438, 80.41844940185547, 83.51795959472656, 86.61746978759766, 89.71697998046875, 92.81649017333984, 95.91600036621094, 99.01551055908203, 102.11502075195312, 105.21453857421875, 108.31404113769531, 111.41355895996094, 114.51306915283203, 117.61257934570312, 120.71208953857422, 123.81159973144531, 126.9111099243164, 130.0106201171875, 133.11013793945312, 136.2096405029297]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 11.0, 9.0, 8.0, 17.0, 25.0, 37.0, 38.0, 32.0, 41.0, 38.0, 41.0, 61.0, 66.0, 68.0, 56.0, 42.0, 51.0, 45.0, 38.0, 39.0, 43.0, 40.0, 26.0, 20.0, 17.0, 19.0, 15.0, 14.0, 10.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.64141082763672, -45.89904022216797, -44.15666961669922, -42.41429901123047, -40.67192840576172, -38.92955780029297, -37.18718338012695, -35.4448127746582, -33.70244216918945, -31.960071563720703, -30.217700958251953, -28.47532844543457, -26.73295783996582, -24.99058723449707, -23.248214721679688, -21.505844116210938, -19.763473510742188, -18.021102905273438, -16.278732299804688, -14.536359786987305, -12.793989181518555, -11.051618576049805, -9.309247016906738, -7.566875457763672, -5.824504852294922, -4.082133769989014, -2.3397626876831055, -0.5973916053771973, 1.144979476928711, 2.887350082397461, 4.629721641540527, 6.372093200683594, 8.114459991455078, 9.856830596923828, 11.599202156066895, 13.341573715209961, 15.083944320678711, 16.82631492614746, 18.568687438964844, 20.311058044433594, 22.053428649902344, 23.795799255371094, 25.538169860839844, 27.280542373657227, 29.022912979125977, 30.765283584594727, 32.50765609741211, 34.25002670288086, 35.99239730834961, 37.73476791381836, 39.47713851928711, 41.21950912475586, 42.961883544921875, 44.704254150390625, 46.446624755859375, 48.188995361328125, 49.931365966796875, 51.673736572265625, 53.416107177734375, 55.158477783203125, 56.900848388671875, 58.643218994140625, 60.38559341430664, 62.12796401977539, 63.87033462524414]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 13.0, 21.0, 30.0, 44.0, 66.0, 126.0, 204.0, 342.0, 646.0, 1353.0, 2779.0, 6186.0, 14034.0, 34194.0, 91336.0, 291574.0, 396674.0, 129155.0, 46125.0, 18544.0, 8131.0, 3516.0, 1657.0, 821.0, 370.0, 251.0, 131.0, 79.0, 58.0, 24.0, 24.0, 14.0, 6.0, 3.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-13.3046875, -12.92626953125, -12.5478515625, -12.16943359375, -11.791015625, -11.41259765625, -11.0341796875, -10.65576171875, -10.27734375, -9.89892578125, -9.5205078125, -9.14208984375, -8.763671875, -8.38525390625, -8.0068359375, -7.62841796875, -7.25, -6.87158203125, -6.4931640625, -6.11474609375, -5.736328125, -5.35791015625, -4.9794921875, -4.60107421875, -4.22265625, -3.84423828125, -3.4658203125, -3.08740234375, -2.708984375, -2.33056640625, -1.9521484375, -1.57373046875, -1.1953125, -0.81689453125, -0.4384765625, -0.06005859375, 0.318359375, 0.69677734375, 1.0751953125, 1.45361328125, 1.83203125, 2.21044921875, 2.5888671875, 2.96728515625, 3.345703125, 3.72412109375, 4.1025390625, 4.48095703125, 4.859375, 5.23779296875, 5.6162109375, 5.99462890625, 6.373046875, 6.75146484375, 7.1298828125, 7.50830078125, 7.88671875, 8.26513671875, 8.6435546875, 9.02197265625, 9.400390625, 9.77880859375, 10.1572265625, 10.53564453125, 10.9140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 12.0, 9.0, 14.0, 14.0, 16.0, 27.0, 33.0, 41.0, 50.0, 54.0, 50.0, 64.0, 57.0, 78.0, 66.0, 73.0, 58.0, 61.0, 37.0, 43.0, 31.0, 27.0, 19.0, 21.0, 17.0, 12.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0859375, -7.87176513671875, -7.6575927734375, -7.44342041015625, -7.229248046875, -7.01507568359375, -6.8009033203125, -6.58673095703125, -6.37255859375, -6.15838623046875, -5.9442138671875, -5.73004150390625, -5.515869140625, -5.30169677734375, -5.0875244140625, -4.87335205078125, -4.6591796875, -4.44500732421875, -4.2308349609375, -4.01666259765625, -3.802490234375, -3.58831787109375, -3.3741455078125, -3.15997314453125, -2.94580078125, -2.73162841796875, -2.5174560546875, -2.30328369140625, -2.089111328125, -1.87493896484375, -1.6607666015625, -1.44659423828125, -1.232421875, -1.01824951171875, -0.8040771484375, -0.58990478515625, -0.375732421875, -0.16156005859375, 0.0526123046875, 0.26678466796875, 0.48095703125, 0.69512939453125, 0.9093017578125, 1.12347412109375, 1.337646484375, 1.55181884765625, 1.7659912109375, 1.98016357421875, 2.1943359375, 2.40850830078125, 2.6226806640625, 2.83685302734375, 3.051025390625, 3.26519775390625, 3.4793701171875, 3.69354248046875, 3.90771484375, 4.12188720703125, 4.3360595703125, 4.55023193359375, 4.764404296875, 4.97857666015625, 5.1927490234375, 5.40692138671875, 5.62109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 11.0, 16.0, 28.0, 40.0, 59.0, 101.0, 174.0, 305.0, 632.0, 1518.0, 5438.0, 34976.0, 545917.0, 420516.0, 31123.0, 5023.0, 1423.0, 556.0, 274.0, 146.0, 84.0, 60.0, 42.0, 35.0, 17.0, 15.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.234375, -25.413818359375, -24.59326171875, -23.772705078125, -22.9521484375, -22.131591796875, -21.31103515625, -20.490478515625, -19.669921875, -18.849365234375, -18.02880859375, -17.208251953125, -16.3876953125, -15.567138671875, -14.74658203125, -13.926025390625, -13.10546875, -12.284912109375, -11.46435546875, -10.643798828125, -9.8232421875, -9.002685546875, -8.18212890625, -7.361572265625, -6.541015625, -5.720458984375, -4.89990234375, -4.079345703125, -3.2587890625, -2.438232421875, -1.61767578125, -0.797119140625, 0.0234375, 0.843994140625, 1.66455078125, 2.485107421875, 3.3056640625, 4.126220703125, 4.94677734375, 5.767333984375, 6.587890625, 7.408447265625, 8.22900390625, 9.049560546875, 9.8701171875, 10.690673828125, 11.51123046875, 12.331787109375, 13.15234375, 13.972900390625, 14.79345703125, 15.614013671875, 16.4345703125, 17.255126953125, 18.07568359375, 18.896240234375, 19.716796875, 20.537353515625, 21.35791015625, 22.178466796875, 22.9990234375, 23.819580078125, 24.64013671875, 25.460693359375, 26.28125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 9.0, 13.0, 13.0, 15.0, 29.0, 33.0, 30.0, 34.0, 39.0, 49.0, 46.0, 57.0, 51.0, 59.0, 55.0, 60.0, 62.0, 58.0, 28.0, 39.0, 35.0, 26.0, 28.0, 27.0, 10.0, 18.0, 12.0, 12.0, 10.0, 9.0, 5.0, 1.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.109375, -19.44091796875, -18.7724609375, -18.10400390625, -17.435546875, -16.76708984375, -16.0986328125, -15.43017578125, -14.76171875, -14.09326171875, -13.4248046875, -12.75634765625, -12.087890625, -11.41943359375, -10.7509765625, -10.08251953125, -9.4140625, -8.74560546875, -8.0771484375, -7.40869140625, -6.740234375, -6.07177734375, -5.4033203125, -4.73486328125, -4.06640625, -3.39794921875, -2.7294921875, -2.06103515625, -1.392578125, -0.72412109375, -0.0556640625, 0.61279296875, 1.28125, 1.94970703125, 2.6181640625, 3.28662109375, 3.955078125, 4.62353515625, 5.2919921875, 5.96044921875, 6.62890625, 7.29736328125, 7.9658203125, 8.63427734375, 9.302734375, 9.97119140625, 10.6396484375, 11.30810546875, 11.9765625, 12.64501953125, 13.3134765625, 13.98193359375, 14.650390625, 15.31884765625, 15.9873046875, 16.65576171875, 17.32421875, 17.99267578125, 18.6611328125, 19.32958984375, 19.998046875, 20.66650390625, 21.3349609375, 22.00341796875, 22.671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 8.0, 14.0, 17.0, 23.0, 45.0, 83.0, 165.0, 330.0, 1036.0, 5303.0, 173858.0, 852774.0, 12304.0, 1694.0, 469.0, 183.0, 89.0, 54.0, 29.0, 19.0, 13.0, 4.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.8125, -23.135498046875, -22.45849609375, -21.781494140625, -21.1044921875, -20.427490234375, -19.75048828125, -19.073486328125, -18.396484375, -17.719482421875, -17.04248046875, -16.365478515625, -15.6884765625, -15.011474609375, -14.33447265625, -13.657470703125, -12.98046875, -12.303466796875, -11.62646484375, -10.949462890625, -10.2724609375, -9.595458984375, -8.91845703125, -8.241455078125, -7.564453125, -6.887451171875, -6.21044921875, -5.533447265625, -4.8564453125, -4.179443359375, -3.50244140625, -2.825439453125, -2.1484375, -1.471435546875, -0.79443359375, -0.117431640625, 0.5595703125, 1.236572265625, 1.91357421875, 2.590576171875, 3.267578125, 3.944580078125, 4.62158203125, 5.298583984375, 5.9755859375, 6.652587890625, 7.32958984375, 8.006591796875, 8.68359375, 9.360595703125, 10.03759765625, 10.714599609375, 11.3916015625, 12.068603515625, 12.74560546875, 13.422607421875, 14.099609375, 14.776611328125, 15.45361328125, 16.130615234375, 16.8076171875, 17.484619140625, 18.16162109375, 18.838623046875, 19.515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 11.0, 5.0, 14.0, 7.0, 11.0, 7.0, 12.0, 19.0, 22.0, 14.0, 40.0, 34.0, 56.0, 64.0, 83.0, 118.0, 112.0, 82.0, 49.0, 48.0, 33.0, 28.0, 35.0, 20.0, 17.0, 7.0, 7.0, 6.0, 7.0, 5.0, 4.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013256072998046875, -0.0012864917516708374, -0.0012473762035369873, -0.0012082606554031372, -0.0011691451072692871, -0.001130029559135437, -0.001090914011001587, -0.0010517984628677368, -0.0010126829147338867, -0.0009735673666000366, -0.0009344518184661865, -0.0008953362703323364, -0.0008562207221984863, -0.0008171051740646362, -0.0007779896259307861, -0.000738874077796936, -0.0006997585296630859, -0.0006606429815292358, -0.0006215274333953857, -0.0005824118852615356, -0.0005432963371276855, -0.0005041807889938354, -0.00046506524085998535, -0.00042594969272613525, -0.00038683414459228516, -0.00034771859645843506, -0.00030860304832458496, -0.00026948750019073486, -0.00023037195205688477, -0.00019125640392303467, -0.00015214085578918457, -0.00011302530765533447, -7.390975952148438e-05, -3.479421138763428e-05, 4.32133674621582e-06, 4.343688488006592e-05, 8.255243301391602e-05, 0.00012166798114776611, 0.0001607835292816162, 0.0001998990774154663, 0.0002390146255493164, 0.0002781301736831665, 0.0003172457218170166, 0.0003563612699508667, 0.0003954768180847168, 0.0004345923662185669, 0.000473707914352417, 0.0005128234624862671, 0.0005519390106201172, 0.0005910545587539673, 0.0006301701068878174, 0.0006692856550216675, 0.0007084012031555176, 0.0007475167512893677, 0.0007866322994232178, 0.0008257478475570679, 0.000864863395690918, 0.0009039789438247681, 0.0009430944919586182, 0.0009822100400924683, 0.0010213255882263184, 0.0010604411363601685, 0.0010995566844940186, 0.0011386722326278687, 0.0011777877807617188]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 9.0, 17.0, 20.0, 42.0, 74.0, 167.0, 387.0, 1019.0, 4143.0, 47402.0, 914051.0, 73900.0, 5253.0, 1256.0, 404.0, 179.0, 104.0, 39.0, 26.0, 19.0, 9.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.2398681640625, -12.721923828125, -12.2039794921875, -11.68603515625, -11.1680908203125, -10.650146484375, -10.1322021484375, -9.6142578125, -9.0963134765625, -8.578369140625, -8.0604248046875, -7.54248046875, -7.0245361328125, -6.506591796875, -5.9886474609375, -5.470703125, -4.9527587890625, -4.434814453125, -3.9168701171875, -3.39892578125, -2.8809814453125, -2.363037109375, -1.8450927734375, -1.3271484375, -0.8092041015625, -0.291259765625, 0.2266845703125, 0.74462890625, 1.2625732421875, 1.780517578125, 2.2984619140625, 2.81640625, 3.3343505859375, 3.852294921875, 4.3702392578125, 4.88818359375, 5.4061279296875, 5.924072265625, 6.4420166015625, 6.9599609375, 7.4779052734375, 7.995849609375, 8.5137939453125, 9.03173828125, 9.5496826171875, 10.067626953125, 10.5855712890625, 11.103515625, 11.6214599609375, 12.139404296875, 12.6573486328125, 13.17529296875, 13.6932373046875, 14.211181640625, 14.7291259765625, 15.2470703125, 15.7650146484375, 16.282958984375, 16.8009033203125, 17.31884765625, 17.8367919921875, 18.354736328125, 18.8726806640625, 19.390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 12.0, 15.0, 27.0, 32.0, 41.0, 53.0, 73.0, 81.0, 116.0, 116.0, 104.0, 84.0, 74.0, 38.0, 33.0, 28.0, 14.0, 11.0, 7.0, 9.0, 3.0, 9.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7109375, -5.4442138671875, -5.177490234375, -4.9107666015625, -4.64404296875, -4.3773193359375, -4.110595703125, -3.8438720703125, -3.5771484375, -3.3104248046875, -3.043701171875, -2.7769775390625, -2.51025390625, -2.2435302734375, -1.976806640625, -1.7100830078125, -1.443359375, -1.1766357421875, -0.909912109375, -0.6431884765625, -0.37646484375, -0.1097412109375, 0.156982421875, 0.4237060546875, 0.6904296875, 0.9571533203125, 1.223876953125, 1.4906005859375, 1.75732421875, 2.0240478515625, 2.290771484375, 2.5574951171875, 2.82421875, 3.0909423828125, 3.357666015625, 3.6243896484375, 3.89111328125, 4.1578369140625, 4.424560546875, 4.6912841796875, 4.9580078125, 5.2247314453125, 5.491455078125, 5.7581787109375, 6.02490234375, 6.2916259765625, 6.558349609375, 6.8250732421875, 7.091796875, 7.3585205078125, 7.625244140625, 7.8919677734375, 8.15869140625, 8.4254150390625, 8.692138671875, 8.9588623046875, 9.2255859375, 9.4923095703125, 9.759033203125, 10.0257568359375, 10.29248046875, 10.5592041015625, 10.825927734375, 11.0926513671875, 11.359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 12.0, 17.0, 49.0, 104.0, 149.0, 250.0, 207.0, 108.0, 45.0, 26.0, 14.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.82061767578125, -161.58380126953125, -156.3470001220703, -151.1101837158203, -145.8733673095703, -140.63656616210938, -135.39974975585938, -130.16293334960938, -124.9261245727539, -119.68931579589844, -114.45249938964844, -109.21569061279297, -103.9788818359375, -98.7420654296875, -93.50525665283203, -88.26844787597656, -83.03163146972656, -77.7948226928711, -72.5580062866211, -67.32119750976562, -62.08438491821289, -56.847572326660156, -51.61076354980469, -46.37395095825195, -41.13713836669922, -35.900325775146484, -30.663515090942383, -25.42670440673828, -20.189891815185547, -14.953079223632812, -9.716268539428711, -4.479457855224609, 0.757354736328125, 5.994166374206543, 11.230978012084961, 16.467788696289062, 21.704601287841797, 26.94141387939453, 32.17822265625, 37.415035247802734, 42.65184783935547, 47.8886604309082, 53.12547302246094, 58.362281799316406, 63.59909439086914, 68.83590698242188, 74.07271575927734, 79.30952453613281, 84.54634094238281, 89.78314971923828, 95.01996612548828, 100.25677490234375, 105.49359130859375, 110.73040008544922, 115.96720886230469, 121.20402526855469, 126.44083404541016, 131.67764282226562, 136.91445922851562, 142.15127563476562, 147.38807678222656, 152.62489318847656, 157.86170959472656, 163.0985107421875, 168.3353271484375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 7.0, 17.0, 13.0, 18.0, 22.0, 21.0, 35.0, 41.0, 45.0, 43.0, 66.0, 79.0, 79.0, 101.0, 82.0, 57.0, 60.0, 30.0, 47.0, 36.0, 19.0, 21.0, 20.0, 15.0, 9.0, 11.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-160.51768493652344, -156.69285583496094, -152.8680419921875, -149.043212890625, -145.21839904785156, -141.39356994628906, -137.56875610351562, -133.74392700195312, -129.91909790039062, -126.09427642822266, -122.26945495605469, -118.44462585449219, -114.61980438232422, -110.79498291015625, -106.97016143798828, -103.14533996582031, -99.32052612304688, -95.4957046508789, -91.67088317871094, -87.84605407714844, -84.02123260498047, -80.1964111328125, -76.37158966064453, -72.54676818847656, -68.72193908691406, -64.8971176147461, -61.07229232788086, -57.24747085571289, -53.42264938354492, -49.59782409667969, -45.77300262451172, -41.94818115234375, -38.12335968017578, -34.29853820800781, -30.47371482849121, -26.64889144897461, -22.82406997680664, -18.99924659729004, -15.174423217773438, -11.349601745605469, -7.524778366088867, -3.699955701828003, 0.12486696243286133, 3.9496898651123047, 7.77451229095459, 11.599334716796875, 15.424158096313477, 19.248979568481445, 23.073802947998047, 26.89862632751465, 30.723447799682617, 34.54827117919922, 38.37309265136719, 42.197914123535156, 46.02273941040039, 49.84756088256836, 53.672386169433594, 57.49720764160156, 61.3220329284668, 65.1468505859375, 68.9716796875, 72.79650115966797, 76.62132263183594, 80.4461441040039, 84.27096557617188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 26.0, 26.0, 41.0, 99.0, 174.0, 365.0, 1067.0, 3576.0, 24636.0, 1001600.0, 3099298.0, 55508.0, 5590.0, 1374.0, 479.0, 210.0, 85.0, 48.0, 25.0, 16.0, 5.0, 8.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.28125, -19.6083984375, -18.935546875, -18.2626953125, -17.58984375, -16.9169921875, -16.244140625, -15.5712890625, -14.8984375, -14.2255859375, -13.552734375, -12.8798828125, -12.20703125, -11.5341796875, -10.861328125, -10.1884765625, -9.515625, -8.8427734375, -8.169921875, -7.4970703125, -6.82421875, -6.1513671875, -5.478515625, -4.8056640625, -4.1328125, -3.4599609375, -2.787109375, -2.1142578125, -1.44140625, -0.7685546875, -0.095703125, 0.5771484375, 1.25, 1.9228515625, 2.595703125, 3.2685546875, 3.94140625, 4.6142578125, 5.287109375, 5.9599609375, 6.6328125, 7.3056640625, 7.978515625, 8.6513671875, 9.32421875, 9.9970703125, 10.669921875, 11.3427734375, 12.015625, 12.6884765625, 13.361328125, 14.0341796875, 14.70703125, 15.3798828125, 16.052734375, 16.7255859375, 17.3984375, 18.0712890625, 18.744140625, 19.4169921875, 20.08984375, 20.7626953125, 21.435546875, 22.1083984375, 22.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 8.0, 2.0, 8.0, 10.0, 12.0, 13.0, 14.0, 24.0, 25.0, 36.0, 47.0, 51.0, 38.0, 49.0, 50.0, 61.0, 67.0, 72.0, 55.0, 48.0, 58.0, 62.0, 38.0, 27.0, 22.0, 28.0, 24.0, 18.0, 10.0, 7.0, 7.0, 8.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.88671875, -6.71258544921875, -6.5384521484375, -6.36431884765625, -6.190185546875, -6.01605224609375, -5.8419189453125, -5.66778564453125, -5.49365234375, -5.31951904296875, -5.1453857421875, -4.97125244140625, -4.797119140625, -4.62298583984375, -4.4488525390625, -4.27471923828125, -4.1005859375, -3.92645263671875, -3.7523193359375, -3.57818603515625, -3.404052734375, -3.22991943359375, -3.0557861328125, -2.88165283203125, -2.70751953125, -2.53338623046875, -2.3592529296875, -2.18511962890625, -2.010986328125, -1.83685302734375, -1.6627197265625, -1.48858642578125, -1.314453125, -1.14031982421875, -0.9661865234375, -0.79205322265625, -0.617919921875, -0.44378662109375, -0.2696533203125, -0.09552001953125, 0.07861328125, 0.25274658203125, 0.4268798828125, 0.60101318359375, 0.775146484375, 0.94927978515625, 1.1234130859375, 1.29754638671875, 1.4716796875, 1.64581298828125, 1.8199462890625, 1.99407958984375, 2.168212890625, 2.34234619140625, 2.5164794921875, 2.69061279296875, 2.86474609375, 3.03887939453125, 3.2130126953125, 3.38714599609375, 3.561279296875, 3.73541259765625, 3.9095458984375, 4.08367919921875, 4.2578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 10.0, 10.0, 12.0, 15.0, 24.0, 36.0, 45.0, 40.0, 86.0, 157.0, 282.0, 603.0, 1486.0, 3395.0, 9498.0, 30531.0, 128485.0, 1171253.0, 2531952.0, 243601.0, 49212.0, 14454.0, 5039.0, 2094.0, 908.0, 462.0, 239.0, 108.0, 95.0, 40.0, 37.0, 27.0, 15.0, 7.0, 7.0, 1.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.73876953125, -10.4150390625, -10.09130859375, -9.767578125, -9.44384765625, -9.1201171875, -8.79638671875, -8.47265625, -8.14892578125, -7.8251953125, -7.50146484375, -7.177734375, -6.85400390625, -6.5302734375, -6.20654296875, -5.8828125, -5.55908203125, -5.2353515625, -4.91162109375, -4.587890625, -4.26416015625, -3.9404296875, -3.61669921875, -3.29296875, -2.96923828125, -2.6455078125, -2.32177734375, -1.998046875, -1.67431640625, -1.3505859375, -1.02685546875, -0.703125, -0.37939453125, -0.0556640625, 0.26806640625, 0.591796875, 0.91552734375, 1.2392578125, 1.56298828125, 1.88671875, 2.21044921875, 2.5341796875, 2.85791015625, 3.181640625, 3.50537109375, 3.8291015625, 4.15283203125, 4.4765625, 4.80029296875, 5.1240234375, 5.44775390625, 5.771484375, 6.09521484375, 6.4189453125, 6.74267578125, 7.06640625, 7.39013671875, 7.7138671875, 8.03759765625, 8.361328125, 8.68505859375, 9.0087890625, 9.33251953125, 9.65625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 5.0, 6.0, 12.0, 7.0, 14.0, 13.0, 21.0, 37.0, 30.0, 34.0, 63.0, 101.0, 151.0, 237.0, 308.0, 421.0, 629.0, 590.0, 462.0, 270.0, 201.0, 117.0, 84.0, 68.0, 40.0, 28.0, 27.0, 27.0, 23.0, 13.0, 5.0, 8.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1484375, -9.7969970703125, -9.445556640625, -9.0941162109375, -8.74267578125, -8.3912353515625, -8.039794921875, -7.6883544921875, -7.3369140625, -6.9854736328125, -6.634033203125, -6.2825927734375, -5.93115234375, -5.5797119140625, -5.228271484375, -4.8768310546875, -4.525390625, -4.1739501953125, -3.822509765625, -3.4710693359375, -3.11962890625, -2.7681884765625, -2.416748046875, -2.0653076171875, -1.7138671875, -1.3624267578125, -1.010986328125, -0.6595458984375, -0.30810546875, 0.0433349609375, 0.394775390625, 0.7462158203125, 1.09765625, 1.4490966796875, 1.800537109375, 2.1519775390625, 2.50341796875, 2.8548583984375, 3.206298828125, 3.5577392578125, 3.9091796875, 4.2606201171875, 4.612060546875, 4.9635009765625, 5.31494140625, 5.6663818359375, 6.017822265625, 6.3692626953125, 6.720703125, 7.0721435546875, 7.423583984375, 7.7750244140625, 8.12646484375, 8.4779052734375, 8.829345703125, 9.1807861328125, 9.5322265625, 9.8836669921875, 10.235107421875, 10.5865478515625, 10.93798828125, 11.2894287109375, 11.640869140625, 11.9923095703125, 12.34375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 30.0, 114.0, 323.0, 322.0, 141.0, 35.0, 15.0, 7.0, 3.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-246.8511962890625, -238.32566833496094, -229.80014038085938, -221.2746124267578, -212.74908447265625, -204.2235565185547, -195.69802856445312, -187.1724853515625, -178.64697265625, -170.12144470214844, -161.59591674804688, -153.0703887939453, -144.54486083984375, -136.0193328857422, -127.4937973022461, -118.96826934814453, -110.44273376464844, -101.91720581054688, -93.39167785644531, -84.86614990234375, -76.34062194824219, -67.81509399414062, -59.28955841064453, -50.76403045654297, -42.238502502441406, -33.712974548339844, -25.18744468688965, -16.661914825439453, -8.13638687133789, 0.3891410827636719, 8.9146728515625, 17.440200805664062, 25.965728759765625, 34.49125671386719, 43.01678466796875, 51.54231643676758, 60.06784439086914, 68.59336853027344, 77.11890411376953, 85.6444320678711, 94.16996002197266, 102.69548797607422, 111.22101593017578, 119.74655151367188, 128.27207946777344, 136.797607421875, 145.32313537597656, 153.84866333007812, 162.3741912841797, 170.89971923828125, 179.4252471923828, 187.95077514648438, 196.47630310058594, 205.0018310546875, 213.52737426757812, 222.05288696289062, 230.57843017578125, 239.1039581298828, 247.62948608398438, 256.155029296875, 264.6805419921875, 273.2060852050781, 281.7315979003906, 290.25714111328125, 298.78265380859375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 11.0, 4.0, 5.0, 17.0, 11.0, 17.0, 9.0, 17.0, 21.0, 20.0, 30.0, 30.0, 26.0, 37.0, 38.0, 33.0, 45.0, 47.0, 42.0, 49.0, 49.0, 43.0, 54.0, 43.0, 39.0, 44.0, 33.0, 27.0, 36.0, 28.0, 14.0, 18.0, 10.0, 7.0, 15.0, 2.0, 11.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.165855407714844, -55.31768035888672, -53.469505310058594, -51.62133026123047, -49.773155212402344, -47.92498016357422, -46.076805114746094, -44.22863006591797, -42.380455017089844, -40.53227996826172, -38.684104919433594, -36.83592987060547, -34.987754821777344, -33.13957977294922, -31.29140281677246, -29.443227767944336, -27.595050811767578, -25.746875762939453, -23.898700714111328, -22.050525665283203, -20.202350616455078, -18.354175567626953, -16.505998611450195, -14.65782356262207, -12.809648513793945, -10.96147346496582, -9.113298416137695, -7.265122413635254, -5.416947364807129, -3.568772315979004, -1.7205963134765625, 0.1275787353515625, 1.9757537841796875, 3.8239290714263916, 5.672104358673096, 7.520279884338379, 9.368454933166504, 11.216629981994629, 13.06480598449707, 14.912981033325195, 16.76115608215332, 18.609331130981445, 20.45750617980957, 22.305683135986328, 24.153858184814453, 26.002033233642578, 27.850208282470703, 29.698383331298828, 31.546558380126953, 33.39473342895508, 35.2429084777832, 37.09108352661133, 38.93925857543945, 40.78743362426758, 42.63561248779297, 44.483787536621094, 46.33196258544922, 48.180137634277344, 50.02831268310547, 51.876487731933594, 53.72466278076172, 55.572837829589844, 57.42101287841797, 59.269187927246094, 61.11736297607422]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 10.0, 6.0, 15.0, 23.0, 29.0, 37.0, 63.0, 93.0, 120.0, 244.0, 376.0, 655.0, 1026.0, 1838.0, 3571.0, 7530.0, 16480.0, 38121.0, 91035.0, 220679.0, 351571.0, 181054.0, 75141.0, 31649.0, 13792.0, 6343.0, 3030.0, 1611.0, 908.0, 543.0, 360.0, 200.0, 132.0, 79.0, 44.0, 40.0, 26.0, 20.0, 15.0, 9.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.953125, -9.655029296875, -9.35693359375, -9.058837890625, -8.7607421875, -8.462646484375, -8.16455078125, -7.866455078125, -7.568359375, -7.270263671875, -6.97216796875, -6.674072265625, -6.3759765625, -6.077880859375, -5.77978515625, -5.481689453125, -5.18359375, -4.885498046875, -4.58740234375, -4.289306640625, -3.9912109375, -3.693115234375, -3.39501953125, -3.096923828125, -2.798828125, -2.500732421875, -2.20263671875, -1.904541015625, -1.6064453125, -1.308349609375, -1.01025390625, -0.712158203125, -0.4140625, -0.115966796875, 0.18212890625, 0.480224609375, 0.7783203125, 1.076416015625, 1.37451171875, 1.672607421875, 1.970703125, 2.268798828125, 2.56689453125, 2.864990234375, 3.1630859375, 3.461181640625, 3.75927734375, 4.057373046875, 4.35546875, 4.653564453125, 4.95166015625, 5.249755859375, 5.5478515625, 5.845947265625, 6.14404296875, 6.442138671875, 6.740234375, 7.038330078125, 7.33642578125, 7.634521484375, 7.9326171875, 8.230712890625, 8.52880859375, 8.826904296875, 9.125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 10.0, 10.0, 15.0, 17.0, 20.0, 28.0, 32.0, 38.0, 33.0, 47.0, 56.0, 55.0, 42.0, 61.0, 55.0, 63.0, 62.0, 55.0, 48.0, 50.0, 40.0, 27.0, 29.0, 28.0, 16.0, 20.0, 7.0, 11.0, 8.0, 5.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.6875, -6.5133056640625, -6.339111328125, -6.1649169921875, -5.99072265625, -5.8165283203125, -5.642333984375, -5.4681396484375, -5.2939453125, -5.1197509765625, -4.945556640625, -4.7713623046875, -4.59716796875, -4.4229736328125, -4.248779296875, -4.0745849609375, -3.900390625, -3.7261962890625, -3.552001953125, -3.3778076171875, -3.20361328125, -3.0294189453125, -2.855224609375, -2.6810302734375, -2.5068359375, -2.3326416015625, -2.158447265625, -1.9842529296875, -1.81005859375, -1.6358642578125, -1.461669921875, -1.2874755859375, -1.11328125, -0.9390869140625, -0.764892578125, -0.5906982421875, -0.41650390625, -0.2423095703125, -0.068115234375, 0.1060791015625, 0.2802734375, 0.4544677734375, 0.628662109375, 0.8028564453125, 0.97705078125, 1.1512451171875, 1.325439453125, 1.4996337890625, 1.673828125, 1.8480224609375, 2.022216796875, 2.1964111328125, 2.37060546875, 2.5447998046875, 2.718994140625, 2.8931884765625, 3.0673828125, 3.2415771484375, 3.415771484375, 3.5899658203125, 3.76416015625, 3.9383544921875, 4.112548828125, 4.2867431640625, 4.4609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 14.0, 12.0, 18.0, 26.0, 24.0, 42.0, 77.0, 94.0, 139.0, 241.0, 374.0, 688.0, 1407.0, 3458.0, 15355.0, 238245.0, 744950.0, 34085.0, 5227.0, 1859.0, 866.0, 467.0, 286.0, 207.0, 103.0, 74.0, 53.0, 34.0, 31.0, 19.0, 13.0, 16.0, 6.0, 10.0, 7.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.09375, -26.0966796875, -25.099609375, -24.1025390625, -23.10546875, -22.1083984375, -21.111328125, -20.1142578125, -19.1171875, -18.1201171875, -17.123046875, -16.1259765625, -15.12890625, -14.1318359375, -13.134765625, -12.1376953125, -11.140625, -10.1435546875, -9.146484375, -8.1494140625, -7.15234375, -6.1552734375, -5.158203125, -4.1611328125, -3.1640625, -2.1669921875, -1.169921875, -0.1728515625, 0.82421875, 1.8212890625, 2.818359375, 3.8154296875, 4.8125, 5.8095703125, 6.806640625, 7.8037109375, 8.80078125, 9.7978515625, 10.794921875, 11.7919921875, 12.7890625, 13.7861328125, 14.783203125, 15.7802734375, 16.77734375, 17.7744140625, 18.771484375, 19.7685546875, 20.765625, 21.7626953125, 22.759765625, 23.7568359375, 24.75390625, 25.7509765625, 26.748046875, 27.7451171875, 28.7421875, 29.7392578125, 30.736328125, 31.7333984375, 32.73046875, 33.7275390625, 34.724609375, 35.7216796875, 36.71875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 10.0, 14.0, 14.0, 14.0, 22.0, 13.0, 32.0, 27.0, 34.0, 39.0, 35.0, 47.0, 40.0, 40.0, 51.0, 49.0, 48.0, 48.0, 53.0, 39.0, 44.0, 42.0, 44.0, 26.0, 20.0, 30.0, 24.0, 18.0, 16.0, 15.0, 9.0, 11.0, 6.0, 4.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-22.859375, -22.209716796875, -21.56005859375, -20.910400390625, -20.2607421875, -19.611083984375, -18.96142578125, -18.311767578125, -17.662109375, -17.012451171875, -16.36279296875, -15.713134765625, -15.0634765625, -14.413818359375, -13.76416015625, -13.114501953125, -12.46484375, -11.815185546875, -11.16552734375, -10.515869140625, -9.8662109375, -9.216552734375, -8.56689453125, -7.917236328125, -7.267578125, -6.617919921875, -5.96826171875, -5.318603515625, -4.6689453125, -4.019287109375, -3.36962890625, -2.719970703125, -2.0703125, -1.420654296875, -0.77099609375, -0.121337890625, 0.5283203125, 1.177978515625, 1.82763671875, 2.477294921875, 3.126953125, 3.776611328125, 4.42626953125, 5.075927734375, 5.7255859375, 6.375244140625, 7.02490234375, 7.674560546875, 8.32421875, 8.973876953125, 9.62353515625, 10.273193359375, 10.9228515625, 11.572509765625, 12.22216796875, 12.871826171875, 13.521484375, 14.171142578125, 14.82080078125, 15.470458984375, 16.1201171875, 16.769775390625, 17.41943359375, 18.069091796875, 18.71875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 10.0, 11.0, 23.0, 22.0, 31.0, 51.0, 77.0, 149.0, 263.0, 527.0, 1732.0, 7142.0, 56543.0, 784221.0, 176974.0, 16054.0, 2977.0, 923.0, 340.0, 186.0, 98.0, 60.0, 29.0, 17.0, 16.0, 17.0, 9.0, 11.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.21875, -10.9046630859375, -10.590576171875, -10.2764892578125, -9.96240234375, -9.6483154296875, -9.334228515625, -9.0201416015625, -8.7060546875, -8.3919677734375, -8.077880859375, -7.7637939453125, -7.44970703125, -7.1356201171875, -6.821533203125, -6.5074462890625, -6.193359375, -5.8792724609375, -5.565185546875, -5.2510986328125, -4.93701171875, -4.6229248046875, -4.308837890625, -3.9947509765625, -3.6806640625, -3.3665771484375, -3.052490234375, -2.7384033203125, -2.42431640625, -2.1102294921875, -1.796142578125, -1.4820556640625, -1.16796875, -0.8538818359375, -0.539794921875, -0.2257080078125, 0.08837890625, 0.4024658203125, 0.716552734375, 1.0306396484375, 1.3447265625, 1.6588134765625, 1.972900390625, 2.2869873046875, 2.60107421875, 2.9151611328125, 3.229248046875, 3.5433349609375, 3.857421875, 4.1715087890625, 4.485595703125, 4.7996826171875, 5.11376953125, 5.4278564453125, 5.741943359375, 6.0560302734375, 6.3701171875, 6.6842041015625, 6.998291015625, 7.3123779296875, 7.62646484375, 7.9405517578125, 8.254638671875, 8.5687255859375, 8.8828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 7.0, 13.0, 18.0, 31.0, 33.0, 52.0, 55.0, 98.0, 165.0, 182.0, 79.0, 75.0, 49.0, 23.0, 32.0, 15.0, 16.0, 17.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002140045166015625, -0.0020686984062194824, -0.00199735164642334, -0.0019260048866271973, -0.0018546581268310547, -0.0017833113670349121, -0.0017119646072387695, -0.001640617847442627, -0.0015692710876464844, -0.0014979243278503418, -0.0014265775680541992, -0.0013552308082580566, -0.001283884048461914, -0.0012125372886657715, -0.001141190528869629, -0.0010698437690734863, -0.0009984970092773438, -0.0009271502494812012, -0.0008558034896850586, -0.000784456729888916, -0.0007131099700927734, -0.0006417632102966309, -0.0005704164505004883, -0.0004990696907043457, -0.0004277229309082031, -0.00035637617111206055, -0.00028502941131591797, -0.0002136826515197754, -0.0001423358917236328, -7.098913192749023e-05, 3.5762786865234375e-07, 7.170438766479492e-05, 0.0001430511474609375, 0.00021439790725708008, 0.00028574466705322266, 0.00035709142684936523, 0.0004284381866455078, 0.0004997849464416504, 0.000571131706237793, 0.0006424784660339355, 0.0007138252258300781, 0.0007851719856262207, 0.0008565187454223633, 0.0009278655052185059, 0.0009992122650146484, 0.001070559024810791, 0.0011419057846069336, 0.0012132525444030762, 0.0012845993041992188, 0.0013559460639953613, 0.001427292823791504, 0.0014986395835876465, 0.001569986343383789, 0.0016413331031799316, 0.0017126798629760742, 0.0017840266227722168, 0.0018553733825683594, 0.001926720142364502, 0.0019980669021606445, 0.002069413661956787, 0.0021407604217529297, 0.0022121071815490723, 0.002283453941345215, 0.0023548007011413574, 0.0024261474609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 7.0, 10.0, 22.0, 25.0, 32.0, 33.0, 73.0, 113.0, 188.0, 363.0, 685.0, 1412.0, 3950.0, 15950.0, 136435.0, 797670.0, 74790.0, 11315.0, 3037.0, 1130.0, 563.0, 283.0, 147.0, 99.0, 57.0, 52.0, 26.0, 19.0, 17.0, 19.0, 6.0, 3.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.5234375, -8.242919921875, -7.96240234375, -7.681884765625, -7.4013671875, -7.120849609375, -6.84033203125, -6.559814453125, -6.279296875, -5.998779296875, -5.71826171875, -5.437744140625, -5.1572265625, -4.876708984375, -4.59619140625, -4.315673828125, -4.03515625, -3.754638671875, -3.47412109375, -3.193603515625, -2.9130859375, -2.632568359375, -2.35205078125, -2.071533203125, -1.791015625, -1.510498046875, -1.22998046875, -0.949462890625, -0.6689453125, -0.388427734375, -0.10791015625, 0.172607421875, 0.453125, 0.733642578125, 1.01416015625, 1.294677734375, 1.5751953125, 1.855712890625, 2.13623046875, 2.416748046875, 2.697265625, 2.977783203125, 3.25830078125, 3.538818359375, 3.8193359375, 4.099853515625, 4.38037109375, 4.660888671875, 4.94140625, 5.221923828125, 5.50244140625, 5.782958984375, 6.0634765625, 6.343994140625, 6.62451171875, 6.905029296875, 7.185546875, 7.466064453125, 7.74658203125, 8.027099609375, 8.3076171875, 8.588134765625, 8.86865234375, 9.149169921875, 9.4296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 6.0, 2.0, 4.0, 6.0, 8.0, 12.0, 10.0, 16.0, 26.0, 22.0, 21.0, 27.0, 37.0, 36.0, 48.0, 54.0, 52.0, 71.0, 77.0, 72.0, 46.0, 54.0, 47.0, 37.0, 42.0, 29.0, 23.0, 15.0, 24.0, 12.0, 8.0, 5.0, 12.0, 7.0, 13.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.5234375, -4.37896728515625, -4.2344970703125, -4.09002685546875, -3.945556640625, -3.80108642578125, -3.6566162109375, -3.51214599609375, -3.36767578125, -3.22320556640625, -3.0787353515625, -2.93426513671875, -2.789794921875, -2.64532470703125, -2.5008544921875, -2.35638427734375, -2.2119140625, -2.06744384765625, -1.9229736328125, -1.77850341796875, -1.634033203125, -1.48956298828125, -1.3450927734375, -1.20062255859375, -1.05615234375, -0.91168212890625, -0.7672119140625, -0.62274169921875, -0.478271484375, -0.33380126953125, -0.1893310546875, -0.04486083984375, 0.099609375, 0.24407958984375, 0.3885498046875, 0.53302001953125, 0.677490234375, 0.82196044921875, 0.9664306640625, 1.11090087890625, 1.25537109375, 1.39984130859375, 1.5443115234375, 1.68878173828125, 1.833251953125, 1.97772216796875, 2.1221923828125, 2.26666259765625, 2.4111328125, 2.55560302734375, 2.7000732421875, 2.84454345703125, 2.989013671875, 3.13348388671875, 3.2779541015625, 3.42242431640625, 3.56689453125, 3.71136474609375, 3.8558349609375, 4.00030517578125, 4.144775390625, 4.28924560546875, 4.4337158203125, 4.57818603515625, 4.72265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 7.0, 13.0, 15.0, 35.0, 79.0, 123.0, 205.0, 244.0, 124.0, 81.0, 37.0, 14.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.18331909179688, -122.13169860839844, -117.08008575439453, -112.0284652709961, -106.97685241699219, -101.92523193359375, -96.87361145019531, -91.8219985961914, -86.7703857421875, -81.71876525878906, -76.66715240478516, -71.61553192138672, -66.56391906738281, -61.512298583984375, -56.4606819152832, -51.40906524658203, -46.357444763183594, -41.30582809448242, -36.25421142578125, -31.202592849731445, -26.150976181030273, -21.0993595123291, -16.047740936279297, -10.996124267578125, -5.944507598876953, -0.892890453338623, 4.158726692199707, 9.210344314575195, 14.261960983276367, 19.31357765197754, 24.365196228027344, 29.416812896728516, 34.46842956542969, 39.52004623413086, 44.57166290283203, 49.62328338623047, 54.674896240234375, 59.72651672363281, 64.77813720703125, 69.82975006103516, 74.88136291503906, 79.9329833984375, 84.9845962524414, 90.03621673583984, 95.08782958984375, 100.13945007324219, 105.19107055664062, 110.24268341064453, 115.29430389404297, 120.3459243774414, 125.39753723144531, 130.44915771484375, 135.5007781982422, 140.55238342285156, 145.60400390625, 150.65562438964844, 155.70724487304688, 160.7588653564453, 165.81048583984375, 170.86209106445312, 175.91371154785156, 180.96533203125, 186.01695251464844, 191.06857299804688, 196.12017822265625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 12.0, 8.0, 17.0, 21.0, 26.0, 20.0, 31.0, 54.0, 36.0, 50.0, 58.0, 83.0, 78.0, 91.0, 65.0, 39.0, 33.0, 33.0, 34.0, 27.0, 26.0, 23.0, 25.0, 22.0, 13.0, 12.0, 6.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-77.29074096679688, -74.36323547363281, -71.43572998046875, -68.50822448730469, -65.58071899414062, -62.65321350097656, -59.7257080078125, -56.79820251464844, -53.870697021484375, -50.94319152832031, -48.01568603515625, -45.08818054199219, -42.160675048828125, -39.23316955566406, -36.3056640625, -33.37815856933594, -30.45065689086914, -27.523151397705078, -24.595645904541016, -21.668140411376953, -18.74063491821289, -15.813130378723145, -12.885625839233398, -9.958120346069336, -7.030614852905273, -4.103109359741211, -1.1756043434143066, 1.7519006729125977, 4.67940616607666, 7.606911659240723, 10.534416198730469, 13.461921691894531, 16.389427185058594, 19.316932678222656, 22.24443817138672, 25.17194366455078, 28.099449157714844, 31.026954650878906, 33.95446014404297, 36.88196563720703, 39.809471130371094, 42.736976623535156, 45.66448211669922, 48.59198760986328, 51.519493103027344, 54.446998596191406, 57.37450408935547, 60.30200958251953, 63.22951126098633, 66.15701293945312, 69.08451843261719, 72.01202392578125, 74.93952941894531, 77.86703491210938, 80.79454040527344, 83.7220458984375, 86.64955139160156, 89.57705688476562, 92.50456237792969, 95.43206787109375, 98.35957336425781, 101.28707885742188, 104.21458435058594, 107.14208984375, 110.06959533691406]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 15.0, 19.0, 33.0, 58.0, 80.0, 174.0, 324.0, 647.0, 1454.0, 3814.0, 12065.0, 51723.0, 484646.0, 3132719.0, 439709.0, 49175.0, 11404.0, 3646.0, 1339.0, 574.0, 295.0, 156.0, 82.0, 44.0, 29.0, 19.0, 13.0, 10.0, 5.0, 2.0, 6.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.90087890625, -7.5908203125, -7.28076171875, -6.970703125, -6.66064453125, -6.3505859375, -6.04052734375, -5.73046875, -5.42041015625, -5.1103515625, -4.80029296875, -4.490234375, -4.18017578125, -3.8701171875, -3.56005859375, -3.25, -2.93994140625, -2.6298828125, -2.31982421875, -2.009765625, -1.69970703125, -1.3896484375, -1.07958984375, -0.76953125, -0.45947265625, -0.1494140625, 0.16064453125, 0.470703125, 0.78076171875, 1.0908203125, 1.40087890625, 1.7109375, 2.02099609375, 2.3310546875, 2.64111328125, 2.951171875, 3.26123046875, 3.5712890625, 3.88134765625, 4.19140625, 4.50146484375, 4.8115234375, 5.12158203125, 5.431640625, 5.74169921875, 6.0517578125, 6.36181640625, 6.671875, 6.98193359375, 7.2919921875, 7.60205078125, 7.912109375, 8.22216796875, 8.5322265625, 8.84228515625, 9.15234375, 9.46240234375, 9.7724609375, 10.08251953125, 10.392578125, 10.70263671875, 11.0126953125, 11.32275390625, 11.6328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 9.0, 10.0, 18.0, 24.0, 24.0, 21.0, 34.0, 37.0, 42.0, 61.0, 76.0, 51.0, 57.0, 61.0, 54.0, 60.0, 64.0, 61.0, 46.0, 32.0, 35.0, 20.0, 28.0, 16.0, 14.0, 4.0, 13.0, 11.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -3.97509765625, -3.7900390625, -3.60498046875, -3.419921875, -3.23486328125, -3.0498046875, -2.86474609375, -2.6796875, -2.49462890625, -2.3095703125, -2.12451171875, -1.939453125, -1.75439453125, -1.5693359375, -1.38427734375, -1.19921875, -1.01416015625, -0.8291015625, -0.64404296875, -0.458984375, -0.27392578125, -0.0888671875, 0.09619140625, 0.28125, 0.46630859375, 0.6513671875, 0.83642578125, 1.021484375, 1.20654296875, 1.3916015625, 1.57666015625, 1.76171875, 1.94677734375, 2.1318359375, 2.31689453125, 2.501953125, 2.68701171875, 2.8720703125, 3.05712890625, 3.2421875, 3.42724609375, 3.6123046875, 3.79736328125, 3.982421875, 4.16748046875, 4.3525390625, 4.53759765625, 4.72265625, 4.90771484375, 5.0927734375, 5.27783203125, 5.462890625, 5.64794921875, 5.8330078125, 6.01806640625, 6.203125, 6.38818359375, 6.5732421875, 6.75830078125, 6.943359375, 7.12841796875, 7.3134765625, 7.49853515625, 7.68359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 7.0, 16.0, 38.0, 65.0, 107.0, 231.0, 671.0, 2224.0, 11850.0, 132969.0, 3788168.0, 235660.0, 17740.0, 3082.0, 907.0, 296.0, 132.0, 63.0, 24.0, 8.0, 11.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.421875, -16.766357421875, -16.11083984375, -15.455322265625, -14.7998046875, -14.144287109375, -13.48876953125, -12.833251953125, -12.177734375, -11.522216796875, -10.86669921875, -10.211181640625, -9.5556640625, -8.900146484375, -8.24462890625, -7.589111328125, -6.93359375, -6.278076171875, -5.62255859375, -4.967041015625, -4.3115234375, -3.656005859375, -3.00048828125, -2.344970703125, -1.689453125, -1.033935546875, -0.37841796875, 0.277099609375, 0.9326171875, 1.588134765625, 2.24365234375, 2.899169921875, 3.5546875, 4.210205078125, 4.86572265625, 5.521240234375, 6.1767578125, 6.832275390625, 7.48779296875, 8.143310546875, 8.798828125, 9.454345703125, 10.10986328125, 10.765380859375, 11.4208984375, 12.076416015625, 12.73193359375, 13.387451171875, 14.04296875, 14.698486328125, 15.35400390625, 16.009521484375, 16.6650390625, 17.320556640625, 17.97607421875, 18.631591796875, 19.287109375, 19.942626953125, 20.59814453125, 21.253662109375, 21.9091796875, 22.564697265625, 23.22021484375, 23.875732421875, 24.53125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 13.0, 17.0, 20.0, 36.0, 62.0, 81.0, 123.0, 279.0, 527.0, 962.0, 866.0, 461.0, 224.0, 127.0, 82.0, 59.0, 30.0, 26.0, 23.0, 14.0, 12.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.734375, -17.23974609375, -16.7451171875, -16.25048828125, -15.755859375, -15.26123046875, -14.7666015625, -14.27197265625, -13.77734375, -13.28271484375, -12.7880859375, -12.29345703125, -11.798828125, -11.30419921875, -10.8095703125, -10.31494140625, -9.8203125, -9.32568359375, -8.8310546875, -8.33642578125, -7.841796875, -7.34716796875, -6.8525390625, -6.35791015625, -5.86328125, -5.36865234375, -4.8740234375, -4.37939453125, -3.884765625, -3.39013671875, -2.8955078125, -2.40087890625, -1.90625, -1.41162109375, -0.9169921875, -0.42236328125, 0.072265625, 0.56689453125, 1.0615234375, 1.55615234375, 2.05078125, 2.54541015625, 3.0400390625, 3.53466796875, 4.029296875, 4.52392578125, 5.0185546875, 5.51318359375, 6.0078125, 6.50244140625, 6.9970703125, 7.49169921875, 7.986328125, 8.48095703125, 8.9755859375, 9.47021484375, 9.96484375, 10.45947265625, 10.9541015625, 11.44873046875, 11.943359375, 12.43798828125, 12.9326171875, 13.42724609375, 13.921875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 8.0, 26.0, 82.0, 198.0, 315.0, 224.0, 87.0, 29.0, 14.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.4720458984375, -174.14645385742188, -167.82086181640625, -161.49526977539062, -155.169677734375, -148.84408569335938, -142.51849365234375, -136.19290161132812, -129.8673095703125, -123.54171752929688, -117.21612548828125, -110.89053344726562, -104.56494140625, -98.23934936523438, -91.91375732421875, -85.58816528320312, -79.2625732421875, -72.93698120117188, -66.61138916015625, -60.285797119140625, -53.960205078125, -47.634613037109375, -41.30902099609375, -34.983428955078125, -28.6578369140625, -22.332244873046875, -16.00665283203125, -9.681060791015625, -3.35546875, 2.970123291015625, 9.29571533203125, 15.621307373046875, 21.946914672851562, 28.272506713867188, 34.59809875488281, 40.92369079589844, 47.24928283691406, 53.57487487792969, 59.90046691894531, 66.22605895996094, 72.55165100097656, 78.87724304199219, 85.20283508300781, 91.52842712402344, 97.85401916503906, 104.17961120605469, 110.50520324707031, 116.83079528808594, 123.15638732910156, 129.4819793701172, 135.8075714111328, 142.13316345214844, 148.45875549316406, 154.7843475341797, 161.1099395751953, 167.43553161621094, 173.76112365722656, 180.0867156982422, 186.4123077392578, 192.73789978027344, 199.06349182128906, 205.3890838623047, 211.7146759033203, 218.04026794433594, 224.36585998535156]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 2.0, 6.0, 8.0, 10.0, 16.0, 23.0, 19.0, 25.0, 26.0, 39.0, 26.0, 34.0, 38.0, 52.0, 50.0, 49.0, 67.0, 39.0, 42.0, 54.0, 49.0, 48.0, 50.0, 34.0, 29.0, 24.0, 24.0, 27.0, 15.0, 21.0, 11.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.355377197265625, -60.53413009643555, -58.712886810302734, -56.891639709472656, -55.07039260864258, -53.2491455078125, -51.42790222167969, -49.60665512084961, -47.78540802001953, -45.96416091918945, -44.14291763305664, -42.32167053222656, -40.500423431396484, -38.679176330566406, -36.857933044433594, -35.036685943603516, -33.2154426574707, -31.394197463989258, -29.57295036315918, -27.751705169677734, -25.930458068847656, -24.10921287536621, -22.287967681884766, -20.466720581054688, -18.645475387573242, -16.824230194091797, -15.002983093261719, -13.181737899780273, -11.360491752624512, -9.53924560546875, -7.718000411987305, -5.896754264831543, -4.075504302978516, -2.254258394241333, -0.4330124855041504, 1.3882331848144531, 3.209479331970215, 5.030725479125977, 6.851970672607422, 8.673216819763184, 10.494462966918945, 12.315709114074707, 14.136955261230469, 15.958200454711914, 17.77944564819336, 19.600692749023438, 21.421937942504883, 23.243183135986328, 25.064430236816406, 26.88567543029785, 28.70692253112793, 30.528167724609375, 32.34941482543945, 34.17066192626953, 35.991905212402344, 37.81315231323242, 39.6343994140625, 41.45564651489258, 43.27688980102539, 45.09813690185547, 46.91938400268555, 48.740631103515625, 50.56187438964844, 52.383121490478516, 54.20436477661133]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 4.0, 7.0, 8.0, 17.0, 24.0, 36.0, 57.0, 77.0, 92.0, 190.0, 268.0, 403.0, 724.0, 1280.0, 2298.0, 4203.0, 8083.0, 16293.0, 35068.0, 82466.0, 218229.0, 365207.0, 182493.0, 70507.0, 30319.0, 14310.0, 7268.0, 3697.0, 2020.0, 1124.0, 661.0, 387.0, 248.0, 151.0, 101.0, 70.0, 45.0, 24.0, 13.0, 20.0, 26.0, 8.0, 0.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.948486328125, -7.67822265625, -7.407958984375, -7.1376953125, -6.867431640625, -6.59716796875, -6.326904296875, -6.056640625, -5.786376953125, -5.51611328125, -5.245849609375, -4.9755859375, -4.705322265625, -4.43505859375, -4.164794921875, -3.89453125, -3.624267578125, -3.35400390625, -3.083740234375, -2.8134765625, -2.543212890625, -2.27294921875, -2.002685546875, -1.732421875, -1.462158203125, -1.19189453125, -0.921630859375, -0.6513671875, -0.381103515625, -0.11083984375, 0.159423828125, 0.4296875, 0.699951171875, 0.97021484375, 1.240478515625, 1.5107421875, 1.781005859375, 2.05126953125, 2.321533203125, 2.591796875, 2.862060546875, 3.13232421875, 3.402587890625, 3.6728515625, 3.943115234375, 4.21337890625, 4.483642578125, 4.75390625, 5.024169921875, 5.29443359375, 5.564697265625, 5.8349609375, 6.105224609375, 6.37548828125, 6.645751953125, 6.916015625, 7.186279296875, 7.45654296875, 7.726806640625, 7.9970703125, 8.267333984375, 8.53759765625, 8.807861328125, 9.078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 4.0, 6.0, 5.0, 10.0, 5.0, 10.0, 7.0, 15.0, 14.0, 14.0, 29.0, 17.0, 29.0, 20.0, 30.0, 31.0, 45.0, 38.0, 40.0, 46.0, 45.0, 46.0, 53.0, 40.0, 41.0, 45.0, 50.0, 31.0, 37.0, 31.0, 26.0, 17.0, 26.0, 18.0, 21.0, 14.0, 4.0, 7.0, 9.0, 6.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.953125, -3.8155517578125, -3.677978515625, -3.5404052734375, -3.40283203125, -3.2652587890625, -3.127685546875, -2.9901123046875, -2.8525390625, -2.7149658203125, -2.577392578125, -2.4398193359375, -2.30224609375, -2.1646728515625, -2.027099609375, -1.8895263671875, -1.751953125, -1.6143798828125, -1.476806640625, -1.3392333984375, -1.20166015625, -1.0640869140625, -0.926513671875, -0.7889404296875, -0.6513671875, -0.5137939453125, -0.376220703125, -0.2386474609375, -0.10107421875, 0.0364990234375, 0.174072265625, 0.3116455078125, 0.44921875, 0.5867919921875, 0.724365234375, 0.8619384765625, 0.99951171875, 1.1370849609375, 1.274658203125, 1.4122314453125, 1.5498046875, 1.6873779296875, 1.824951171875, 1.9625244140625, 2.10009765625, 2.2376708984375, 2.375244140625, 2.5128173828125, 2.650390625, 2.7879638671875, 2.925537109375, 3.0631103515625, 3.20068359375, 3.3382568359375, 3.475830078125, 3.6134033203125, 3.7509765625, 3.8885498046875, 4.026123046875, 4.1636962890625, 4.30126953125, 4.4388427734375, 4.576416015625, 4.7139892578125, 4.8515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 6.0, 15.0, 15.0, 21.0, 29.0, 58.0, 82.0, 106.0, 178.0, 271.0, 516.0, 971.0, 2150.0, 6679.0, 44688.0, 776216.0, 193468.0, 16181.0, 3687.0, 1408.0, 725.0, 428.0, 204.0, 159.0, 100.0, 58.0, 44.0, 25.0, 16.0, 16.0, 9.0, 9.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.84375, -31.950439453125, -31.05712890625, -30.163818359375, -29.2705078125, -28.377197265625, -27.48388671875, -26.590576171875, -25.697265625, -24.803955078125, -23.91064453125, -23.017333984375, -22.1240234375, -21.230712890625, -20.33740234375, -19.444091796875, -18.55078125, -17.657470703125, -16.76416015625, -15.870849609375, -14.9775390625, -14.084228515625, -13.19091796875, -12.297607421875, -11.404296875, -10.510986328125, -9.61767578125, -8.724365234375, -7.8310546875, -6.937744140625, -6.04443359375, -5.151123046875, -4.2578125, -3.364501953125, -2.47119140625, -1.577880859375, -0.6845703125, 0.208740234375, 1.10205078125, 1.995361328125, 2.888671875, 3.781982421875, 4.67529296875, 5.568603515625, 6.4619140625, 7.355224609375, 8.24853515625, 9.141845703125, 10.03515625, 10.928466796875, 11.82177734375, 12.715087890625, 13.6083984375, 14.501708984375, 15.39501953125, 16.288330078125, 17.181640625, 18.074951171875, 18.96826171875, 19.861572265625, 20.7548828125, 21.648193359375, 22.54150390625, 23.434814453125, 24.328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 12.0, 10.0, 15.0, 29.0, 28.0, 38.0, 35.0, 38.0, 46.0, 57.0, 68.0, 54.0, 69.0, 71.0, 59.0, 50.0, 43.0, 42.0, 52.0, 42.0, 20.0, 27.0, 17.0, 21.0, 13.0, 13.0, 11.0, 4.0, 7.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.673828125, -17.92578125, -17.177734375, -16.4296875, -15.681640625, -14.93359375, -14.185546875, -13.4375, -12.689453125, -11.94140625, -11.193359375, -10.4453125, -9.697265625, -8.94921875, -8.201171875, -7.453125, -6.705078125, -5.95703125, -5.208984375, -4.4609375, -3.712890625, -2.96484375, -2.216796875, -1.46875, -0.720703125, 0.02734375, 0.775390625, 1.5234375, 2.271484375, 3.01953125, 3.767578125, 4.515625, 5.263671875, 6.01171875, 6.759765625, 7.5078125, 8.255859375, 9.00390625, 9.751953125, 10.5, 11.248046875, 11.99609375, 12.744140625, 13.4921875, 14.240234375, 14.98828125, 15.736328125, 16.484375, 17.232421875, 17.98046875, 18.728515625, 19.4765625, 20.224609375, 20.97265625, 21.720703125, 22.46875, 23.216796875, 23.96484375, 24.712890625, 25.4609375, 26.208984375, 26.95703125, 27.705078125, 28.453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 7.0, 11.0, 8.0, 14.0, 17.0, 11.0, 18.0, 37.0, 54.0, 92.0, 155.0, 374.0, 1013.0, 3885.0, 28594.0, 742841.0, 252117.0, 15242.0, 2585.0, 797.0, 269.0, 167.0, 78.0, 46.0, 28.0, 25.0, 16.0, 7.0, 8.0, 9.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8203125, -10.4580078125, -10.095703125, -9.7333984375, -9.37109375, -9.0087890625, -8.646484375, -8.2841796875, -7.921875, -7.5595703125, -7.197265625, -6.8349609375, -6.47265625, -6.1103515625, -5.748046875, -5.3857421875, -5.0234375, -4.6611328125, -4.298828125, -3.9365234375, -3.57421875, -3.2119140625, -2.849609375, -2.4873046875, -2.125, -1.7626953125, -1.400390625, -1.0380859375, -0.67578125, -0.3134765625, 0.048828125, 0.4111328125, 0.7734375, 1.1357421875, 1.498046875, 1.8603515625, 2.22265625, 2.5849609375, 2.947265625, 3.3095703125, 3.671875, 4.0341796875, 4.396484375, 4.7587890625, 5.12109375, 5.4833984375, 5.845703125, 6.2080078125, 6.5703125, 6.9326171875, 7.294921875, 7.6572265625, 8.01953125, 8.3818359375, 8.744140625, 9.1064453125, 9.46875, 9.8310546875, 10.193359375, 10.5556640625, 10.91796875, 11.2802734375, 11.642578125, 12.0048828125, 12.3671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 6.0, 9.0, 7.0, 11.0, 18.0, 14.0, 12.0, 17.0, 26.0, 27.0, 38.0, 61.0, 87.0, 134.0, 117.0, 104.0, 66.0, 50.0, 36.0, 34.0, 22.0, 14.0, 23.0, 11.0, 14.0, 6.0, 10.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00121307373046875, -0.001171410083770752, -0.001129746437072754, -0.0010880827903747559, -0.0010464191436767578, -0.0010047554969787598, -0.0009630918502807617, -0.0009214282035827637, -0.0008797645568847656, -0.0008381009101867676, -0.0007964372634887695, -0.0007547736167907715, -0.0007131099700927734, -0.0006714463233947754, -0.0006297826766967773, -0.0005881190299987793, -0.0005464553833007812, -0.0005047917366027832, -0.00046312808990478516, -0.0004214644432067871, -0.00037980079650878906, -0.000338137149810791, -0.00029647350311279297, -0.0002548098564147949, -0.00021314620971679688, -0.00017148256301879883, -0.00012981891632080078, -8.815526962280273e-05, -4.649162292480469e-05, -4.827976226806641e-06, 3.6835670471191406e-05, 7.849931716918945e-05, 0.0001201629638671875, 0.00016182661056518555, 0.0002034902572631836, 0.00024515390396118164, 0.0002868175506591797, 0.00032848119735717773, 0.0003701448440551758, 0.00041180849075317383, 0.0004534721374511719, 0.0004951357841491699, 0.000536799430847168, 0.000578463077545166, 0.0006201267242431641, 0.0006617903709411621, 0.0007034540176391602, 0.0007451176643371582, 0.0007867813110351562, 0.0008284449577331543, 0.0008701086044311523, 0.0009117722511291504, 0.0009534358978271484, 0.0009950995445251465, 0.0010367631912231445, 0.0010784268379211426, 0.0011200904846191406, 0.0011617541313171387, 0.0012034177780151367, 0.0012450814247131348, 0.0012867450714111328, 0.0013284087181091309, 0.001370072364807129, 0.001411736011505127, 0.001453399658203125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 17.0, 16.0, 21.0, 46.0, 56.0, 98.0, 161.0, 306.0, 522.0, 1017.0, 2680.0, 9627.0, 65954.0, 790962.0, 153977.0, 16450.0, 3839.0, 1331.0, 634.0, 331.0, 178.0, 135.0, 62.0, 43.0, 34.0, 15.0, 16.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -8.0352783203125, -7.781494140625, -7.5277099609375, -7.27392578125, -7.0201416015625, -6.766357421875, -6.5125732421875, -6.2587890625, -6.0050048828125, -5.751220703125, -5.4974365234375, -5.24365234375, -4.9898681640625, -4.736083984375, -4.4822998046875, -4.228515625, -3.9747314453125, -3.720947265625, -3.4671630859375, -3.21337890625, -2.9595947265625, -2.705810546875, -2.4520263671875, -2.1982421875, -1.9444580078125, -1.690673828125, -1.4368896484375, -1.18310546875, -0.9293212890625, -0.675537109375, -0.4217529296875, -0.16796875, 0.0858154296875, 0.339599609375, 0.5933837890625, 0.84716796875, 1.1009521484375, 1.354736328125, 1.6085205078125, 1.8623046875, 2.1160888671875, 2.369873046875, 2.6236572265625, 2.87744140625, 3.1312255859375, 3.385009765625, 3.6387939453125, 3.892578125, 4.1463623046875, 4.400146484375, 4.6539306640625, 4.90771484375, 5.1614990234375, 5.415283203125, 5.6690673828125, 5.9228515625, 6.1766357421875, 6.430419921875, 6.6842041015625, 6.93798828125, 7.1917724609375, 7.445556640625, 7.6993408203125, 7.953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 14.0, 14.0, 24.0, 24.0, 30.0, 38.0, 49.0, 57.0, 82.0, 102.0, 93.0, 94.0, 73.0, 55.0, 54.0, 35.0, 25.0, 32.0, 17.0, 13.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.57421875, -5.402587890625, -5.23095703125, -5.059326171875, -4.8876953125, -4.716064453125, -4.54443359375, -4.372802734375, -4.201171875, -4.029541015625, -3.85791015625, -3.686279296875, -3.5146484375, -3.343017578125, -3.17138671875, -2.999755859375, -2.828125, -2.656494140625, -2.48486328125, -2.313232421875, -2.1416015625, -1.969970703125, -1.79833984375, -1.626708984375, -1.455078125, -1.283447265625, -1.11181640625, -0.940185546875, -0.7685546875, -0.596923828125, -0.42529296875, -0.253662109375, -0.08203125, 0.089599609375, 0.26123046875, 0.432861328125, 0.6044921875, 0.776123046875, 0.94775390625, 1.119384765625, 1.291015625, 1.462646484375, 1.63427734375, 1.805908203125, 1.9775390625, 2.149169921875, 2.32080078125, 2.492431640625, 2.6640625, 2.835693359375, 3.00732421875, 3.178955078125, 3.3505859375, 3.522216796875, 3.69384765625, 3.865478515625, 4.037109375, 4.208740234375, 4.38037109375, 4.552001953125, 4.7236328125, 4.895263671875, 5.06689453125, 5.238525390625, 5.41015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 14.0, 27.0, 78.0, 142.0, 314.0, 203.0, 101.0, 49.0, 27.0, 8.0, 8.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.22621154785156, -149.6083526611328, -143.99050903320312, -138.37265014648438, -132.75479125976562, -127.1369400024414, -121.51908874511719, -115.90122985839844, -110.28337860107422, -104.66552734375, -99.04766845703125, -93.42981719970703, -87.81196594238281, -82.19410705566406, -76.57625579833984, -70.95840454101562, -65.34054565429688, -59.72269058227539, -54.104835510253906, -48.48698425292969, -42.8691291809082, -37.25127410888672, -31.6334228515625, -26.015567779541016, -20.39771270751953, -14.779858589172363, -9.162004470825195, -3.5441513061523438, 2.0737037658691406, 7.691558837890625, 13.309410095214844, 18.927265167236328, 24.54510498046875, 30.162960052490234, 35.78081512451172, 41.39866638183594, 47.01652145385742, 52.634376525878906, 58.252227783203125, 63.87008285522461, 69.4879379272461, 75.10578918457031, 80.72364807128906, 86.34149932861328, 91.9593505859375, 97.57720947265625, 103.19506072998047, 108.81291198730469, 114.43077087402344, 120.04862213134766, 125.6664810180664, 131.28433227539062, 136.90219116210938, 142.52005004882812, 148.1378936767578, 153.75575256347656, 159.37359619140625, 164.991455078125, 170.6092987060547, 176.22715759277344, 181.8450164794922, 187.46286010742188, 193.08071899414062, 198.69857788085938, 204.31643676757812]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 10.0, 11.0, 22.0, 12.0, 23.0, 30.0, 29.0, 32.0, 20.0, 29.0, 56.0, 59.0, 84.0, 82.0, 80.0, 50.0, 47.0, 42.0, 39.0, 37.0, 33.0, 41.0, 23.0, 17.0, 15.0, 9.0, 12.0, 7.0, 9.0, 11.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0], "bins": [-104.61738586425781, -102.0246810913086, -99.43196868896484, -96.83926391601562, -94.24655151367188, -91.65384674072266, -89.06114196777344, -86.46842956542969, -83.87572479248047, -81.28302001953125, -78.6903076171875, -76.09760284423828, -73.50489807128906, -70.91218566894531, -68.3194808959961, -65.72677612304688, -63.134063720703125, -60.54135513305664, -57.948646545410156, -55.35594177246094, -52.76323318481445, -50.17052459716797, -47.57781982421875, -44.985111236572266, -42.39240264892578, -39.7996940612793, -37.20698547363281, -34.614280700683594, -32.02157211303711, -29.428863525390625, -26.836156845092773, -24.243450164794922, -21.650741577148438, -19.058032989501953, -16.4653263092041, -13.872618675231934, -11.279911041259766, -8.687203407287598, -6.09449577331543, -3.501789093017578, -0.9090805053710938, 1.6836271286010742, 4.276334762573242, 6.86904239654541, 9.461750030517578, 12.054457664489746, 14.647165298461914, 17.239871978759766, 19.83258056640625, 22.425289154052734, 25.017995834350586, 27.610702514648438, 30.203411102294922, 32.796119689941406, 35.388824462890625, 37.98153305053711, 40.574241638183594, 43.16695022583008, 45.75965881347656, 48.35236358642578, 50.945072174072266, 53.53778076171875, 56.13048553466797, 58.72319412231445, 61.31590270996094]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 3.0, 16.0, 16.0, 21.0, 30.0, 66.0, 91.0, 145.0, 271.0, 486.0, 1163.0, 2744.0, 8630.0, 42001.0, 742483.0, 3203506.0, 164209.0, 19792.0, 5186.0, 1825.0, 776.0, 368.0, 193.0, 105.0, 53.0, 35.0, 15.0, 14.0, 9.0, 11.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8984375, -11.5408935546875, -11.183349609375, -10.8258056640625, -10.46826171875, -10.1107177734375, -9.753173828125, -9.3956298828125, -9.0380859375, -8.6805419921875, -8.322998046875, -7.9654541015625, -7.60791015625, -7.2503662109375, -6.892822265625, -6.5352783203125, -6.177734375, -5.8201904296875, -5.462646484375, -5.1051025390625, -4.74755859375, -4.3900146484375, -4.032470703125, -3.6749267578125, -3.3173828125, -2.9598388671875, -2.602294921875, -2.2447509765625, -1.88720703125, -1.5296630859375, -1.172119140625, -0.8145751953125, -0.45703125, -0.0994873046875, 0.258056640625, 0.6156005859375, 0.97314453125, 1.3306884765625, 1.688232421875, 2.0457763671875, 2.4033203125, 2.7608642578125, 3.118408203125, 3.4759521484375, 3.83349609375, 4.1910400390625, 4.548583984375, 4.9061279296875, 5.263671875, 5.6212158203125, 5.978759765625, 6.3363037109375, 6.69384765625, 7.0513916015625, 7.408935546875, 7.7664794921875, 8.1240234375, 8.4815673828125, 8.839111328125, 9.1966552734375, 9.55419921875, 9.9117431640625, 10.269287109375, 10.6268310546875, 10.984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 9.0, 12.0, 16.0, 8.0, 14.0, 27.0, 26.0, 31.0, 30.0, 37.0, 39.0, 42.0, 61.0, 46.0, 52.0, 59.0, 44.0, 48.0, 45.0, 45.0, 53.0, 37.0, 30.0, 31.0, 30.0, 20.0, 15.0, 14.0, 19.0, 10.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.14654541015625, -4.0001220703125, -3.85369873046875, -3.707275390625, -3.56085205078125, -3.4144287109375, -3.26800537109375, -3.12158203125, -2.97515869140625, -2.8287353515625, -2.68231201171875, -2.535888671875, -2.38946533203125, -2.2430419921875, -2.09661865234375, -1.9501953125, -1.80377197265625, -1.6573486328125, -1.51092529296875, -1.364501953125, -1.21807861328125, -1.0716552734375, -0.92523193359375, -0.77880859375, -0.63238525390625, -0.4859619140625, -0.33953857421875, -0.193115234375, -0.04669189453125, 0.0997314453125, 0.24615478515625, 0.392578125, 0.53900146484375, 0.6854248046875, 0.83184814453125, 0.978271484375, 1.12469482421875, 1.2711181640625, 1.41754150390625, 1.56396484375, 1.71038818359375, 1.8568115234375, 2.00323486328125, 2.149658203125, 2.29608154296875, 2.4425048828125, 2.58892822265625, 2.7353515625, 2.88177490234375, 3.0281982421875, 3.17462158203125, 3.321044921875, 3.46746826171875, 3.6138916015625, 3.76031494140625, 3.90673828125, 4.05316162109375, 4.1995849609375, 4.34600830078125, 4.492431640625, 4.63885498046875, 4.7852783203125, 4.93170166015625, 5.078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 11.0, 6.0, 33.0, 57.0, 150.0, 342.0, 897.0, 4601.0, 124276.0, 4031977.0, 28044.0, 2685.0, 700.0, 279.0, 115.0, 53.0, 23.0, 16.0, 11.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.40625, -39.26220703125, -38.1181640625, -36.97412109375, -35.830078125, -34.68603515625, -33.5419921875, -32.39794921875, -31.25390625, -30.10986328125, -28.9658203125, -27.82177734375, -26.677734375, -25.53369140625, -24.3896484375, -23.24560546875, -22.1015625, -20.95751953125, -19.8134765625, -18.66943359375, -17.525390625, -16.38134765625, -15.2373046875, -14.09326171875, -12.94921875, -11.80517578125, -10.6611328125, -9.51708984375, -8.373046875, -7.22900390625, -6.0849609375, -4.94091796875, -3.796875, -2.65283203125, -1.5087890625, -0.36474609375, 0.779296875, 1.92333984375, 3.0673828125, 4.21142578125, 5.35546875, 6.49951171875, 7.6435546875, 8.78759765625, 9.931640625, 11.07568359375, 12.2197265625, 13.36376953125, 14.5078125, 15.65185546875, 16.7958984375, 17.93994140625, 19.083984375, 20.22802734375, 21.3720703125, 22.51611328125, 23.66015625, 24.80419921875, 25.9482421875, 27.09228515625, 28.236328125, 29.38037109375, 30.5244140625, 31.66845703125, 32.8125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 10.0, 6.0, 21.0, 51.0, 82.0, 190.0, 920.0, 1822.0, 635.0, 176.0, 83.0, 30.0, 20.0, 11.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5, -28.615966796875, -27.73193359375, -26.847900390625, -25.9638671875, -25.079833984375, -24.19580078125, -23.311767578125, -22.427734375, -21.543701171875, -20.65966796875, -19.775634765625, -18.8916015625, -18.007568359375, -17.12353515625, -16.239501953125, -15.35546875, -14.471435546875, -13.58740234375, -12.703369140625, -11.8193359375, -10.935302734375, -10.05126953125, -9.167236328125, -8.283203125, -7.399169921875, -6.51513671875, -5.631103515625, -4.7470703125, -3.863037109375, -2.97900390625, -2.094970703125, -1.2109375, -0.326904296875, 0.55712890625, 1.441162109375, 2.3251953125, 3.209228515625, 4.09326171875, 4.977294921875, 5.861328125, 6.745361328125, 7.62939453125, 8.513427734375, 9.3974609375, 10.281494140625, 11.16552734375, 12.049560546875, 12.93359375, 13.817626953125, 14.70166015625, 15.585693359375, 16.4697265625, 17.353759765625, 18.23779296875, 19.121826171875, 20.005859375, 20.889892578125, 21.77392578125, 22.657958984375, 23.5419921875, 24.426025390625, 25.31005859375, 26.194091796875, 27.078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 10.0, 13.0, 25.0, 91.0, 285.0, 344.0, 165.0, 43.0, 12.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.77316284179688, -130.68785095214844, -122.60254669189453, -114.51724243164062, -106.43193054199219, -98.34661865234375, -90.26131439208984, -82.17601013183594, -74.0906982421875, -66.00538635253906, -57.920082092285156, -49.834774017333984, -41.74946594238281, -33.66415786743164, -25.57884979248047, -17.493541717529297, -9.408233642578125, -1.3229255676269531, 6.762382507324219, 14.84769058227539, 22.932998657226562, 31.018306732177734, 39.103614807128906, 47.18892288208008, 55.27423095703125, 63.35953903198242, 71.4448471069336, 79.5301513671875, 87.61546325683594, 95.70077514648438, 103.78607940673828, 111.87138366699219, 119.95672607421875, 128.0420379638672, 136.12734985351562, 144.212646484375, 152.29795837402344, 160.38327026367188, 168.46856689453125, 176.5538787841797, 184.63919067382812, 192.72450256347656, 200.809814453125, 208.89511108398438, 216.9804229736328, 225.06573486328125, 233.15103149414062, 241.23634338378906, 249.3216552734375, 257.4069519042969, 265.4922790527344, 273.57757568359375, 281.66290283203125, 289.7481994628906, 297.83349609375, 305.9188232421875, 314.0041198730469, 322.08941650390625, 330.17474365234375, 338.2600402832031, 346.3453369140625, 354.4306640625, 362.5159606933594, 370.6012878417969, 378.68658447265625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 8.0, 8.0, 17.0, 17.0, 24.0, 39.0, 41.0, 47.0, 46.0, 49.0, 55.0, 67.0, 66.0, 78.0, 56.0, 78.0, 63.0, 46.0, 42.0, 26.0, 32.0, 27.0, 18.0, 16.0, 10.0, 9.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-102.17898559570312, -99.54145812988281, -96.90392303466797, -94.26639556884766, -91.62886810302734, -88.9913330078125, -86.35380554199219, -83.71627807617188, -81.07874298095703, -78.44121551513672, -75.80368041992188, -73.16615295410156, -70.52862548828125, -67.8910903930664, -65.2535629272461, -62.616031646728516, -59.9785041809082, -57.340972900390625, -54.70344543457031, -52.065914154052734, -49.428382873535156, -46.790855407714844, -44.153324127197266, -41.51579284667969, -38.878265380859375, -36.2407341003418, -33.603206634521484, -30.965675354003906, -28.328144073486328, -25.690614700317383, -23.053085327148438, -20.41555404663086, -17.77802276611328, -15.14049243927002, -12.502962112426758, -9.865432739257812, -7.227902412414551, -4.590372085571289, -1.9528427124023438, 0.6846885681152344, 3.3222179412841797, 5.959748268127441, 8.597278594970703, 11.234807968139648, 13.87233829498291, 16.509868621826172, 19.147397994995117, 21.784929275512695, 24.42245864868164, 27.059988021850586, 29.697519302368164, 32.33504867553711, 34.97257995605469, 37.610107421875, 40.24763870239258, 42.885169982910156, 45.52269744873047, 48.16022872924805, 50.79775619506836, 53.43528747558594, 56.072818756103516, 58.710350036621094, 61.347877502441406, 63.985408782958984, 66.62294006347656]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 15.0, 18.0, 28.0, 44.0, 55.0, 101.0, 164.0, 297.0, 555.0, 984.0, 2089.0, 4274.0, 10290.0, 27474.0, 85241.0, 266090.0, 393718.0, 171970.0, 53431.0, 18260.0, 7083.0, 3051.0, 1533.0, 780.0, 391.0, 224.0, 145.0, 81.0, 58.0, 28.0, 21.0, 19.0, 16.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.640625, -7.37060546875, -7.1005859375, -6.83056640625, -6.560546875, -6.29052734375, -6.0205078125, -5.75048828125, -5.48046875, -5.21044921875, -4.9404296875, -4.67041015625, -4.400390625, -4.13037109375, -3.8603515625, -3.59033203125, -3.3203125, -3.05029296875, -2.7802734375, -2.51025390625, -2.240234375, -1.97021484375, -1.7001953125, -1.43017578125, -1.16015625, -0.89013671875, -0.6201171875, -0.35009765625, -0.080078125, 0.18994140625, 0.4599609375, 0.72998046875, 1.0, 1.27001953125, 1.5400390625, 1.81005859375, 2.080078125, 2.35009765625, 2.6201171875, 2.89013671875, 3.16015625, 3.43017578125, 3.7001953125, 3.97021484375, 4.240234375, 4.51025390625, 4.7802734375, 5.05029296875, 5.3203125, 5.59033203125, 5.8603515625, 6.13037109375, 6.400390625, 6.67041015625, 6.9404296875, 7.21044921875, 7.48046875, 7.75048828125, 8.0205078125, 8.29052734375, 8.560546875, 8.83056640625, 9.1005859375, 9.37060546875, 9.640625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 15.0, 15.0, 16.0, 19.0, 19.0, 36.0, 34.0, 43.0, 48.0, 39.0, 52.0, 57.0, 59.0, 54.0, 77.0, 40.0, 70.0, 47.0, 56.0, 37.0, 33.0, 25.0, 30.0, 16.0, 16.0, 11.0, 7.0, 5.0, 10.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.7191162109375, -7.512451171875, -7.3057861328125, -7.09912109375, -6.8924560546875, -6.685791015625, -6.4791259765625, -6.2724609375, -6.0657958984375, -5.859130859375, -5.6524658203125, -5.44580078125, -5.2391357421875, -5.032470703125, -4.8258056640625, -4.619140625, -4.4124755859375, -4.205810546875, -3.9991455078125, -3.79248046875, -3.5858154296875, -3.379150390625, -3.1724853515625, -2.9658203125, -2.7591552734375, -2.552490234375, -2.3458251953125, -2.13916015625, -1.9324951171875, -1.725830078125, -1.5191650390625, -1.3125, -1.1058349609375, -0.899169921875, -0.6925048828125, -0.48583984375, -0.2791748046875, -0.072509765625, 0.1341552734375, 0.3408203125, 0.5474853515625, 0.754150390625, 0.9608154296875, 1.16748046875, 1.3741455078125, 1.580810546875, 1.7874755859375, 1.994140625, 2.2008056640625, 2.407470703125, 2.6141357421875, 2.82080078125, 3.0274658203125, 3.234130859375, 3.4407958984375, 3.6474609375, 3.8541259765625, 4.060791015625, 4.2674560546875, 4.47412109375, 4.6807861328125, 4.887451171875, 5.0941162109375, 5.30078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 12.0, 17.0, 26.0, 20.0, 30.0, 60.0, 82.0, 137.0, 222.0, 420.0, 800.0, 1996.0, 5767.0, 21730.0, 127983.0, 691780.0, 160577.0, 26117.0, 6490.0, 2193.0, 944.0, 448.0, 259.0, 138.0, 93.0, 51.0, 40.0, 31.0, 23.0, 19.0, 4.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.2734375, -14.7894287109375, -14.305419921875, -13.8214111328125, -13.33740234375, -12.8533935546875, -12.369384765625, -11.8853759765625, -11.4013671875, -10.9173583984375, -10.433349609375, -9.9493408203125, -9.46533203125, -8.9813232421875, -8.497314453125, -8.0133056640625, -7.529296875, -7.0452880859375, -6.561279296875, -6.0772705078125, -5.59326171875, -5.1092529296875, -4.625244140625, -4.1412353515625, -3.6572265625, -3.1732177734375, -2.689208984375, -2.2052001953125, -1.72119140625, -1.2371826171875, -0.753173828125, -0.2691650390625, 0.21484375, 0.6988525390625, 1.182861328125, 1.6668701171875, 2.15087890625, 2.6348876953125, 3.118896484375, 3.6029052734375, 4.0869140625, 4.5709228515625, 5.054931640625, 5.5389404296875, 6.02294921875, 6.5069580078125, 6.990966796875, 7.4749755859375, 7.958984375, 8.4429931640625, 8.927001953125, 9.4110107421875, 9.89501953125, 10.3790283203125, 10.863037109375, 11.3470458984375, 11.8310546875, 12.3150634765625, 12.799072265625, 13.2830810546875, 13.76708984375, 14.2510986328125, 14.735107421875, 15.2191162109375, 15.703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 13.0, 15.0, 8.0, 10.0, 20.0, 25.0, 21.0, 36.0, 39.0, 45.0, 54.0, 54.0, 52.0, 52.0, 65.0, 55.0, 54.0, 49.0, 50.0, 51.0, 37.0, 21.0, 28.0, 26.0, 24.0, 16.0, 16.0, 14.0, 9.0, 6.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.390625, -25.673583984375, -24.95654296875, -24.239501953125, -23.5224609375, -22.805419921875, -22.08837890625, -21.371337890625, -20.654296875, -19.937255859375, -19.22021484375, -18.503173828125, -17.7861328125, -17.069091796875, -16.35205078125, -15.635009765625, -14.91796875, -14.200927734375, -13.48388671875, -12.766845703125, -12.0498046875, -11.332763671875, -10.61572265625, -9.898681640625, -9.181640625, -8.464599609375, -7.74755859375, -7.030517578125, -6.3134765625, -5.596435546875, -4.87939453125, -4.162353515625, -3.4453125, -2.728271484375, -2.01123046875, -1.294189453125, -0.5771484375, 0.139892578125, 0.85693359375, 1.573974609375, 2.291015625, 3.008056640625, 3.72509765625, 4.442138671875, 5.1591796875, 5.876220703125, 6.59326171875, 7.310302734375, 8.02734375, 8.744384765625, 9.46142578125, 10.178466796875, 10.8955078125, 11.612548828125, 12.32958984375, 13.046630859375, 13.763671875, 14.480712890625, 15.19775390625, 15.914794921875, 16.6318359375, 17.348876953125, 18.06591796875, 18.782958984375, 19.5]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 10.0, 9.0, 11.0, 35.0, 33.0, 53.0, 69.0, 101.0, 119.0, 216.0, 301.0, 458.0, 733.0, 1219.0, 2333.0, 5059.0, 12771.0, 43554.0, 239220.0, 632233.0, 75895.0, 19634.0, 7269.0, 3221.0, 1630.0, 875.0, 487.0, 327.0, 209.0, 141.0, 76.0, 66.0, 44.0, 44.0, 29.0, 19.0, 11.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.82952880859375, -4.6746826171875, -4.51983642578125, -4.364990234375, -4.21014404296875, -4.0552978515625, -3.90045166015625, -3.74560546875, -3.59075927734375, -3.4359130859375, -3.28106689453125, -3.126220703125, -2.97137451171875, -2.8165283203125, -2.66168212890625, -2.5068359375, -2.35198974609375, -2.1971435546875, -2.04229736328125, -1.887451171875, -1.73260498046875, -1.5777587890625, -1.42291259765625, -1.26806640625, -1.11322021484375, -0.9583740234375, -0.80352783203125, -0.648681640625, -0.49383544921875, -0.3389892578125, -0.18414306640625, -0.029296875, 0.12554931640625, 0.2803955078125, 0.43524169921875, 0.590087890625, 0.74493408203125, 0.8997802734375, 1.05462646484375, 1.20947265625, 1.36431884765625, 1.5191650390625, 1.67401123046875, 1.828857421875, 1.98370361328125, 2.1385498046875, 2.29339599609375, 2.4482421875, 2.60308837890625, 2.7579345703125, 2.91278076171875, 3.067626953125, 3.22247314453125, 3.3773193359375, 3.53216552734375, 3.68701171875, 3.84185791015625, 3.9967041015625, 4.15155029296875, 4.306396484375, 4.46124267578125, 4.6160888671875, 4.77093505859375, 4.92578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 10.0, 24.0, 27.0, 74.0, 163.0, 330.0, 182.0, 90.0, 41.0, 17.0, 11.0, 5.0, 9.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00299072265625, -0.0029015839099884033, -0.0028124451637268066, -0.00272330641746521, -0.0026341676712036133, -0.0025450289249420166, -0.00245589017868042, -0.0023667514324188232, -0.0022776126861572266, -0.00218847393989563, -0.002099335193634033, -0.0020101964473724365, -0.0019210577011108398, -0.0018319189548492432, -0.0017427802085876465, -0.0016536414623260498, -0.0015645027160644531, -0.0014753639698028564, -0.0013862252235412598, -0.001297086477279663, -0.0012079477310180664, -0.0011188089847564697, -0.001029670238494873, -0.0009405314922332764, -0.0008513927459716797, -0.000762253999710083, -0.0006731152534484863, -0.0005839765071868896, -0.000494837760925293, -0.0004056990146636963, -0.0003165602684020996, -0.00022742152214050293, -0.00013828277587890625, -4.914402961730957e-05, 3.999471664428711e-05, 0.0001291334629058838, 0.00021827220916748047, 0.00030741095542907715, 0.00039654970169067383, 0.0004856884479522705, 0.0005748271942138672, 0.0006639659404754639, 0.0007531046867370605, 0.0008422434329986572, 0.0009313821792602539, 0.0010205209255218506, 0.0011096596717834473, 0.001198798418045044, 0.0012879371643066406, 0.0013770759105682373, 0.001466214656829834, 0.0015553534030914307, 0.0016444921493530273, 0.001733630895614624, 0.0018227696418762207, 0.0019119083881378174, 0.002001047134399414, 0.0020901858806610107, 0.0021793246269226074, 0.002268463373184204, 0.0023576021194458008, 0.0024467408657073975, 0.002535879611968994, 0.002625018358230591, 0.0027141571044921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 7.0, 19.0, 24.0, 40.0, 73.0, 143.0, 405.0, 1040.0, 3237.0, 13338.0, 91813.0, 804966.0, 112503.0, 15328.0, 3649.0, 1134.0, 431.0, 170.0, 83.0, 55.0, 25.0, 21.0, 8.0, 7.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.17047119140625, -7.9268798828125, -7.68328857421875, -7.439697265625, -7.19610595703125, -6.9525146484375, -6.70892333984375, -6.46533203125, -6.22174072265625, -5.9781494140625, -5.73455810546875, -5.490966796875, -5.24737548828125, -5.0037841796875, -4.76019287109375, -4.5166015625, -4.27301025390625, -4.0294189453125, -3.78582763671875, -3.542236328125, -3.29864501953125, -3.0550537109375, -2.81146240234375, -2.56787109375, -2.32427978515625, -2.0806884765625, -1.83709716796875, -1.593505859375, -1.34991455078125, -1.1063232421875, -0.86273193359375, -0.619140625, -0.37554931640625, -0.1319580078125, 0.11163330078125, 0.355224609375, 0.59881591796875, 0.8424072265625, 1.08599853515625, 1.32958984375, 1.57318115234375, 1.8167724609375, 2.06036376953125, 2.303955078125, 2.54754638671875, 2.7911376953125, 3.03472900390625, 3.2783203125, 3.52191162109375, 3.7655029296875, 4.00909423828125, 4.252685546875, 4.49627685546875, 4.7398681640625, 4.98345947265625, 5.22705078125, 5.47064208984375, 5.7142333984375, 5.95782470703125, 6.201416015625, 6.44500732421875, 6.6885986328125, 6.93218994140625, 7.17578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 3.0, 9.0, 7.0, 15.0, 14.0, 17.0, 26.0, 38.0, 54.0, 72.0, 98.0, 120.0, 131.0, 100.0, 68.0, 71.0, 32.0, 19.0, 25.0, 21.0, 9.0, 6.0, 6.0, 7.0, 7.0, 10.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.3203125, -8.12255859375, -7.9248046875, -7.72705078125, -7.529296875, -7.33154296875, -7.1337890625, -6.93603515625, -6.73828125, -6.54052734375, -6.3427734375, -6.14501953125, -5.947265625, -5.74951171875, -5.5517578125, -5.35400390625, -5.15625, -4.95849609375, -4.7607421875, -4.56298828125, -4.365234375, -4.16748046875, -3.9697265625, -3.77197265625, -3.57421875, -3.37646484375, -3.1787109375, -2.98095703125, -2.783203125, -2.58544921875, -2.3876953125, -2.18994140625, -1.9921875, -1.79443359375, -1.5966796875, -1.39892578125, -1.201171875, -1.00341796875, -0.8056640625, -0.60791015625, -0.41015625, -0.21240234375, -0.0146484375, 0.18310546875, 0.380859375, 0.57861328125, 0.7763671875, 0.97412109375, 1.171875, 1.36962890625, 1.5673828125, 1.76513671875, 1.962890625, 2.16064453125, 2.3583984375, 2.55615234375, 2.75390625, 2.95166015625, 3.1494140625, 3.34716796875, 3.544921875, 3.74267578125, 3.9404296875, 4.13818359375, 4.3359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 15.0, 41.0, 210.0, 482.0, 177.0, 43.0, 20.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-359.50439453125, -351.2229309082031, -342.9414978027344, -334.6600341796875, -326.37860107421875, -318.0971374511719, -309.815673828125, -301.53424072265625, -293.2527770996094, -284.9713134765625, -276.68988037109375, -268.4084167480469, -260.1269836425781, -251.84552001953125, -243.56407165527344, -235.28262329101562, -227.0011749267578, -218.7197265625, -210.4382781982422, -202.15682983398438, -193.8753662109375, -185.5939178466797, -177.31246948242188, -169.03102111816406, -160.74957275390625, -152.46812438964844, -144.18667602539062, -135.90521240234375, -127.62376403808594, -119.34231567382812, -111.06086730957031, -102.7794189453125, -94.49795532226562, -86.21650695800781, -77.93505096435547, -69.65360260009766, -61.37215042114258, -53.0906982421875, -44.80924987792969, -36.52779769897461, -28.24634552001953, -19.964893341064453, -11.683443069458008, -3.4019927978515625, 4.879459381103516, 13.160911560058594, 21.442359924316406, 29.723812103271484, 38.00526428222656, 46.28671646118164, 54.56816864013672, 62.84961700439453, 71.13107299804688, 79.41252136230469, 87.6939697265625, 95.97541809082031, 104.25687408447266, 112.53832244873047, 120.81977844238281, 129.10122680664062, 137.38267517089844, 145.66412353515625, 153.94558715820312, 162.22703552246094, 170.50848388671875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 5.0, 16.0, 19.0, 16.0, 17.0, 26.0, 27.0, 30.0, 44.0, 48.0, 48.0, 80.0, 105.0, 95.0, 89.0, 52.0, 45.0, 44.0, 24.0, 34.0, 23.0, 28.0, 18.0, 14.0, 14.0, 10.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.67813110351562, -73.49794006347656, -70.3177490234375, -67.13755798339844, -63.95736312866211, -60.77717208862305, -57.596981048583984, -54.416786193847656, -51.236595153808594, -48.05640411376953, -44.87621307373047, -41.696022033691406, -38.51582717895508, -35.335636138916016, -32.15544509887695, -28.975252151489258, -25.795063018798828, -22.614871978759766, -19.43467903137207, -16.254487991333008, -13.074295997619629, -9.89410400390625, -6.7139129638671875, -3.533720016479492, -0.3535289764404297, 2.82666277885437, 6.00685453414917, 9.18704605102539, 12.36723804473877, 15.547430038452148, 18.72762107849121, 21.907814025878906, 25.08800506591797, 28.26819610595703, 31.448389053344727, 34.628578186035156, 37.808773040771484, 40.98896408081055, 44.16915512084961, 47.34934997558594, 50.529541015625, 53.70973205566406, 56.889923095703125, 60.07011413574219, 63.250308990478516, 66.43049621582031, 69.61068725585938, 72.79088592529297, 75.9710693359375, 79.15126037597656, 82.33145141601562, 85.51164245605469, 88.69183349609375, 91.87202453613281, 95.05221557617188, 98.23241424560547, 101.41260528564453, 104.5927963256836, 107.77298736572266, 110.95317840576172, 114.13336944580078, 117.31356811523438, 120.49375915527344, 123.6739501953125, 126.85414123535156]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 17.0, 15.0, 26.0, 36.0, 41.0, 57.0, 99.0, 130.0, 195.0, 256.0, 388.0, 521.0, 896.0, 1578.0, 2946.0, 6910.0, 20706.0, 96255.0, 663163.0, 2493862.0, 758812.0, 109318.0, 22972.0, 7460.0, 3163.0, 1684.0, 947.0, 596.0, 359.0, 252.0, 188.0, 117.0, 75.0, 62.0, 40.0, 31.0, 19.0, 17.0, 11.0, 10.0, 8.0, 3.0, 7.0, 3.0, 7.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.546875, -6.3572998046875, -6.167724609375, -5.9781494140625, -5.78857421875, -5.5989990234375, -5.409423828125, -5.2198486328125, -5.0302734375, -4.8406982421875, -4.651123046875, -4.4615478515625, -4.27197265625, -4.0823974609375, -3.892822265625, -3.7032470703125, -3.513671875, -3.3240966796875, -3.134521484375, -2.9449462890625, -2.75537109375, -2.5657958984375, -2.376220703125, -2.1866455078125, -1.9970703125, -1.8074951171875, -1.617919921875, -1.4283447265625, -1.23876953125, -1.0491943359375, -0.859619140625, -0.6700439453125, -0.48046875, -0.2908935546875, -0.101318359375, 0.0882568359375, 0.27783203125, 0.4674072265625, 0.656982421875, 0.8465576171875, 1.0361328125, 1.2257080078125, 1.415283203125, 1.6048583984375, 1.79443359375, 1.9840087890625, 2.173583984375, 2.3631591796875, 2.552734375, 2.7423095703125, 2.931884765625, 3.1214599609375, 3.31103515625, 3.5006103515625, 3.690185546875, 3.8797607421875, 4.0693359375, 4.2589111328125, 4.448486328125, 4.6380615234375, 4.82763671875, 5.0172119140625, 5.206787109375, 5.3963623046875, 5.5859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 9.0, 3.0, 11.0, 7.0, 10.0, 7.0, 14.0, 16.0, 19.0, 24.0, 34.0, 18.0, 24.0, 33.0, 46.0, 39.0, 40.0, 38.0, 51.0, 52.0, 43.0, 43.0, 40.0, 48.0, 34.0, 34.0, 29.0, 31.0, 32.0, 27.0, 36.0, 15.0, 14.0, 17.0, 10.0, 11.0, 15.0, 11.0, 4.0, 2.0, 6.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.95703125, -4.80810546875, -4.6591796875, -4.51025390625, -4.361328125, -4.21240234375, -4.0634765625, -3.91455078125, -3.765625, -3.61669921875, -3.4677734375, -3.31884765625, -3.169921875, -3.02099609375, -2.8720703125, -2.72314453125, -2.57421875, -2.42529296875, -2.2763671875, -2.12744140625, -1.978515625, -1.82958984375, -1.6806640625, -1.53173828125, -1.3828125, -1.23388671875, -1.0849609375, -0.93603515625, -0.787109375, -0.63818359375, -0.4892578125, -0.34033203125, -0.19140625, -0.04248046875, 0.1064453125, 0.25537109375, 0.404296875, 0.55322265625, 0.7021484375, 0.85107421875, 1.0, 1.14892578125, 1.2978515625, 1.44677734375, 1.595703125, 1.74462890625, 1.8935546875, 2.04248046875, 2.19140625, 2.34033203125, 2.4892578125, 2.63818359375, 2.787109375, 2.93603515625, 3.0849609375, 3.23388671875, 3.3828125, 3.53173828125, 3.6806640625, 3.82958984375, 3.978515625, 4.12744140625, 4.2763671875, 4.42529296875, 4.57421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 19.0, 27.0, 82.0, 254.0, 1078.0, 19614.0, 4142688.0, 28708.0, 1289.0, 326.0, 111.0, 46.0, 23.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.33544921875, -39.0146484375, -37.69384765625, -36.373046875, -35.05224609375, -33.7314453125, -32.41064453125, -31.08984375, -29.76904296875, -28.4482421875, -27.12744140625, -25.806640625, -24.48583984375, -23.1650390625, -21.84423828125, -20.5234375, -19.20263671875, -17.8818359375, -16.56103515625, -15.240234375, -13.91943359375, -12.5986328125, -11.27783203125, -9.95703125, -8.63623046875, -7.3154296875, -5.99462890625, -4.673828125, -3.35302734375, -2.0322265625, -0.71142578125, 0.609375, 1.93017578125, 3.2509765625, 4.57177734375, 5.892578125, 7.21337890625, 8.5341796875, 9.85498046875, 11.17578125, 12.49658203125, 13.8173828125, 15.13818359375, 16.458984375, 17.77978515625, 19.1005859375, 20.42138671875, 21.7421875, 23.06298828125, 24.3837890625, 25.70458984375, 27.025390625, 28.34619140625, 29.6669921875, 30.98779296875, 32.30859375, 33.62939453125, 34.9501953125, 36.27099609375, 37.591796875, 38.91259765625, 40.2333984375, 41.55419921875, 42.875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 6.0, 6.0, 11.0, 12.0, 17.0, 34.0, 54.0, 109.0, 203.0, 440.0, 875.0, 1041.0, 590.0, 319.0, 145.0, 81.0, 43.0, 19.0, 26.0, 15.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8984375, -7.4649658203125, -7.031494140625, -6.5980224609375, -6.16455078125, -5.7310791015625, -5.297607421875, -4.8641357421875, -4.4306640625, -3.9971923828125, -3.563720703125, -3.1302490234375, -2.69677734375, -2.2633056640625, -1.829833984375, -1.3963623046875, -0.962890625, -0.5294189453125, -0.095947265625, 0.3375244140625, 0.77099609375, 1.2044677734375, 1.637939453125, 2.0714111328125, 2.5048828125, 2.9383544921875, 3.371826171875, 3.8052978515625, 4.23876953125, 4.6722412109375, 5.105712890625, 5.5391845703125, 5.97265625, 6.4061279296875, 6.839599609375, 7.2730712890625, 7.70654296875, 8.1400146484375, 8.573486328125, 9.0069580078125, 9.4404296875, 9.8739013671875, 10.307373046875, 10.7408447265625, 11.17431640625, 11.6077880859375, 12.041259765625, 12.4747314453125, 12.908203125, 13.3416748046875, 13.775146484375, 14.2086181640625, 14.64208984375, 15.0755615234375, 15.509033203125, 15.9425048828125, 16.3759765625, 16.8094482421875, 17.242919921875, 17.6763916015625, 18.10986328125, 18.5433349609375, 18.976806640625, 19.4102783203125, 19.84375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 12.0, 26.0, 110.0, 333.0, 313.0, 128.0, 48.0, 13.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.99601745605469, -77.53012084960938, -71.06421661376953, -64.59831237792969, -58.132415771484375, -51.6665153503418, -45.20061492919922, -38.73471450805664, -32.26881408691406, -25.802913665771484, -19.337013244628906, -12.871112823486328, -6.40521240234375, 0.060688018798828125, 6.526588439941406, 12.992488861083984, 19.458389282226562, 25.92428970336914, 32.39019012451172, 38.8560905456543, 45.321990966796875, 51.78789138793945, 58.25379180908203, 64.71969604492188, 71.18559265136719, 77.6514892578125, 84.11739349365234, 90.58329772949219, 97.0491943359375, 103.51509094238281, 109.98099517822266, 116.4468994140625, 122.91278076171875, 129.37867736816406, 135.84457397460938, 142.31048583984375, 148.77638244628906, 155.24227905273438, 161.70819091796875, 168.17408752441406, 174.63998413085938, 181.1058807373047, 187.57177734375, 194.03768920898438, 200.5035858154297, 206.969482421875, 213.43539428710938, 219.9012908935547, 226.3671875, 232.8330841064453, 239.29898071289062, 245.764892578125, 252.2307891845703, 258.6966857910156, 265.16259765625, 271.62847900390625, 278.0943908691406, 284.560302734375, 291.02618408203125, 297.4920959472656, 303.9580078125, 310.42388916015625, 316.8898010253906, 323.3556823730469, 329.82159423828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 11.0, 14.0, 15.0, 25.0, 22.0, 33.0, 37.0, 37.0, 45.0, 43.0, 64.0, 66.0, 60.0, 64.0, 46.0, 57.0, 51.0, 49.0, 45.0, 39.0, 48.0, 33.0, 30.0, 10.0, 11.0, 12.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.43990325927734, -66.47781372070312, -64.5157241821289, -62.55363082885742, -60.5915412902832, -58.629451751708984, -56.6673583984375, -54.70526885986328, -52.74317932128906, -50.781089782714844, -48.819000244140625, -46.85690689086914, -44.89481735229492, -42.9327278137207, -40.97063446044922, -39.008544921875, -37.04645538330078, -35.08436584472656, -33.122276306152344, -31.16018295288086, -29.19809341430664, -27.236003875732422, -25.27391242980957, -23.31182098388672, -21.3497314453125, -19.38764190673828, -17.42555046081543, -15.463459968566895, -13.50136947631836, -11.539278984069824, -9.577188491821289, -7.615097999572754, -5.653011322021484, -3.690920829772949, -1.728830337524414, 0.2332601547241211, 2.1953506469726562, 4.157441139221191, 6.119531631469727, 8.081622123718262, 10.043712615966797, 12.005803108215332, 13.967893600463867, 15.929984092712402, 17.892074584960938, 19.854164123535156, 21.816255569458008, 23.77834701538086, 25.740436553955078, 27.702526092529297, 29.66461753845215, 31.626708984375, 33.58879852294922, 35.55088806152344, 37.512977600097656, 39.47507095336914, 41.43716049194336, 43.39925003051758, 45.36134338378906, 47.32343292236328, 49.2855224609375, 51.24761199951172, 53.20970153808594, 55.17179489135742, 57.13388442993164]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 12.0, 3.0, 8.0, 20.0, 31.0, 28.0, 30.0, 57.0, 103.0, 159.0, 262.0, 418.0, 712.0, 1280.0, 2398.0, 4608.0, 8989.0, 19458.0, 44098.0, 105905.0, 242760.0, 313887.0, 173316.0, 71582.0, 30382.0, 13844.0, 6628.0, 3377.0, 1775.0, 959.0, 600.0, 312.0, 212.0, 120.0, 65.0, 48.0, 37.0, 18.0, 16.0, 12.0, 11.0, 10.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.86328125, -4.68499755859375, -4.5067138671875, -4.32843017578125, -4.150146484375, -3.97186279296875, -3.7935791015625, -3.61529541015625, -3.43701171875, -3.25872802734375, -3.0804443359375, -2.90216064453125, -2.723876953125, -2.54559326171875, -2.3673095703125, -2.18902587890625, -2.0107421875, -1.83245849609375, -1.6541748046875, -1.47589111328125, -1.297607421875, -1.11932373046875, -0.9410400390625, -0.76275634765625, -0.58447265625, -0.40618896484375, -0.2279052734375, -0.04962158203125, 0.128662109375, 0.30694580078125, 0.4852294921875, 0.66351318359375, 0.841796875, 1.02008056640625, 1.1983642578125, 1.37664794921875, 1.554931640625, 1.73321533203125, 1.9114990234375, 2.08978271484375, 2.26806640625, 2.44635009765625, 2.6246337890625, 2.80291748046875, 2.981201171875, 3.15948486328125, 3.3377685546875, 3.51605224609375, 3.6943359375, 3.87261962890625, 4.0509033203125, 4.22918701171875, 4.407470703125, 4.58575439453125, 4.7640380859375, 4.94232177734375, 5.12060546875, 5.29888916015625, 5.4771728515625, 5.65545654296875, 5.833740234375, 6.01202392578125, 6.1903076171875, 6.36859130859375, 6.546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 9.0, 9.0, 13.0, 11.0, 17.0, 17.0, 12.0, 19.0, 20.0, 18.0, 17.0, 26.0, 26.0, 40.0, 29.0, 34.0, 34.0, 30.0, 38.0, 43.0, 32.0, 41.0, 28.0, 43.0, 30.0, 37.0, 25.0, 27.0, 44.0, 27.0, 26.0, 25.0, 22.0, 10.0, 14.0, 13.0, 15.0, 10.0, 7.0, 14.0, 6.0, 4.0, 8.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.20703125, -4.07733154296875, -3.9476318359375, -3.81793212890625, -3.688232421875, -3.55853271484375, -3.4288330078125, -3.29913330078125, -3.16943359375, -3.03973388671875, -2.9100341796875, -2.78033447265625, -2.650634765625, -2.52093505859375, -2.3912353515625, -2.26153564453125, -2.1318359375, -2.00213623046875, -1.8724365234375, -1.74273681640625, -1.613037109375, -1.48333740234375, -1.3536376953125, -1.22393798828125, -1.09423828125, -0.96453857421875, -0.8348388671875, -0.70513916015625, -0.575439453125, -0.44573974609375, -0.3160400390625, -0.18634033203125, -0.056640625, 0.07305908203125, 0.2027587890625, 0.33245849609375, 0.462158203125, 0.59185791015625, 0.7215576171875, 0.85125732421875, 0.98095703125, 1.11065673828125, 1.2403564453125, 1.37005615234375, 1.499755859375, 1.62945556640625, 1.7591552734375, 1.88885498046875, 2.0185546875, 2.14825439453125, 2.2779541015625, 2.40765380859375, 2.537353515625, 2.66705322265625, 2.7967529296875, 2.92645263671875, 3.05615234375, 3.18585205078125, 3.3155517578125, 3.44525146484375, 3.574951171875, 3.70465087890625, 3.8343505859375, 3.96405029296875, 4.09375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 4.0, 5.0, 13.0, 16.0, 25.0, 38.0, 45.0, 79.0, 107.0, 148.0, 235.0, 386.0, 679.0, 1332.0, 3720.0, 14898.0, 102866.0, 767625.0, 131074.0, 17632.0, 4225.0, 1495.0, 696.0, 411.0, 265.0, 148.0, 96.0, 71.0, 53.0, 42.0, 27.0, 27.0, 21.0, 8.0, 14.0, 7.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.71875, -16.220458984375, -15.72216796875, -15.223876953125, -14.7255859375, -14.227294921875, -13.72900390625, -13.230712890625, -12.732421875, -12.234130859375, -11.73583984375, -11.237548828125, -10.7392578125, -10.240966796875, -9.74267578125, -9.244384765625, -8.74609375, -8.247802734375, -7.74951171875, -7.251220703125, -6.7529296875, -6.254638671875, -5.75634765625, -5.258056640625, -4.759765625, -4.261474609375, -3.76318359375, -3.264892578125, -2.7666015625, -2.268310546875, -1.77001953125, -1.271728515625, -0.7734375, -0.275146484375, 0.22314453125, 0.721435546875, 1.2197265625, 1.718017578125, 2.21630859375, 2.714599609375, 3.212890625, 3.711181640625, 4.20947265625, 4.707763671875, 5.2060546875, 5.704345703125, 6.20263671875, 6.700927734375, 7.19921875, 7.697509765625, 8.19580078125, 8.694091796875, 9.1923828125, 9.690673828125, 10.18896484375, 10.687255859375, 11.185546875, 11.683837890625, 12.18212890625, 12.680419921875, 13.1787109375, 13.677001953125, 14.17529296875, 14.673583984375, 15.171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 12.0, 18.0, 18.0, 29.0, 25.0, 24.0, 31.0, 48.0, 59.0, 48.0, 59.0, 48.0, 69.0, 67.0, 51.0, 52.0, 54.0, 42.0, 32.0, 33.0, 39.0, 24.0, 22.0, 13.0, 11.0, 15.0, 8.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -21.594970703125, -20.89306640625, -20.191162109375, -19.4892578125, -18.787353515625, -18.08544921875, -17.383544921875, -16.681640625, -15.979736328125, -15.27783203125, -14.575927734375, -13.8740234375, -13.172119140625, -12.47021484375, -11.768310546875, -11.06640625, -10.364501953125, -9.66259765625, -8.960693359375, -8.2587890625, -7.556884765625, -6.85498046875, -6.153076171875, -5.451171875, -4.749267578125, -4.04736328125, -3.345458984375, -2.6435546875, -1.941650390625, -1.23974609375, -0.537841796875, 0.1640625, 0.865966796875, 1.56787109375, 2.269775390625, 2.9716796875, 3.673583984375, 4.37548828125, 5.077392578125, 5.779296875, 6.481201171875, 7.18310546875, 7.885009765625, 8.5869140625, 9.288818359375, 9.99072265625, 10.692626953125, 11.39453125, 12.096435546875, 12.79833984375, 13.500244140625, 14.2021484375, 14.904052734375, 15.60595703125, 16.307861328125, 17.009765625, 17.711669921875, 18.41357421875, 19.115478515625, 19.8173828125, 20.519287109375, 21.22119140625, 21.923095703125, 22.625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 13.0, 20.0, 25.0, 48.0, 95.0, 246.0, 826.0, 3844.0, 33458.0, 925655.0, 76146.0, 6418.0, 1185.0, 336.0, 114.0, 48.0, 24.0, 17.0, 5.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.1640625, -10.8321533203125, -10.500244140625, -10.1683349609375, -9.83642578125, -9.5045166015625, -9.172607421875, -8.8406982421875, -8.5087890625, -8.1768798828125, -7.844970703125, -7.5130615234375, -7.18115234375, -6.8492431640625, -6.517333984375, -6.1854248046875, -5.853515625, -5.5216064453125, -5.189697265625, -4.8577880859375, -4.52587890625, -4.1939697265625, -3.862060546875, -3.5301513671875, -3.1982421875, -2.8663330078125, -2.534423828125, -2.2025146484375, -1.87060546875, -1.5386962890625, -1.206787109375, -0.8748779296875, -0.54296875, -0.2110595703125, 0.120849609375, 0.4527587890625, 0.78466796875, 1.1165771484375, 1.448486328125, 1.7803955078125, 2.1123046875, 2.4442138671875, 2.776123046875, 3.1080322265625, 3.43994140625, 3.7718505859375, 4.103759765625, 4.4356689453125, 4.767578125, 5.0994873046875, 5.431396484375, 5.7633056640625, 6.09521484375, 6.4271240234375, 6.759033203125, 7.0909423828125, 7.4228515625, 7.7547607421875, 8.086669921875, 8.4185791015625, 8.75048828125, 9.0823974609375, 9.414306640625, 9.7462158203125, 10.078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 12.0, 13.0, 18.0, 23.0, 29.0, 39.0, 64.0, 129.0, 224.0, 182.0, 86.0, 55.0, 29.0, 18.0, 12.0, 15.0, 6.0, 6.0, 4.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011968612670898438, -0.0011520981788635254, -0.001107335090637207, -0.0010625720024108887, -0.0010178089141845703, -0.000973045825958252, -0.0009282827377319336, -0.0008835196495056152, -0.0008387565612792969, -0.0007939934730529785, -0.0007492303848266602, -0.0007044672966003418, -0.0006597042083740234, -0.0006149411201477051, -0.0005701780319213867, -0.0005254149436950684, -0.00048065185546875, -0.00043588876724243164, -0.0003911256790161133, -0.0003463625907897949, -0.00030159950256347656, -0.0002568364143371582, -0.00021207332611083984, -0.00016731023788452148, -0.00012254714965820312, -7.778406143188477e-05, -3.3020973205566406e-05, 1.1742115020751953e-05, 5.650520324707031e-05, 0.00010126829147338867, 0.00014603137969970703, 0.0001907944679260254, 0.00023555755615234375, 0.0002803206443786621, 0.00032508373260498047, 0.00036984682083129883, 0.0004146099090576172, 0.00045937299728393555, 0.0005041360855102539, 0.0005488991737365723, 0.0005936622619628906, 0.000638425350189209, 0.0006831884384155273, 0.0007279515266418457, 0.0007727146148681641, 0.0008174777030944824, 0.0008622407913208008, 0.0009070038795471191, 0.0009517669677734375, 0.0009965300559997559, 0.0010412931442260742, 0.0010860562324523926, 0.001130819320678711, 0.0011755824089050293, 0.0012203454971313477, 0.001265108585357666, 0.0013098716735839844, 0.0013546347618103027, 0.001399397850036621, 0.0014441609382629395, 0.0014889240264892578, 0.0015336871147155762, 0.0015784502029418945, 0.0016232132911682129, 0.0016679763793945312]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 9.0, 16.0, 15.0, 48.0, 149.0, 442.0, 2295.0, 96934.0, 941833.0, 5782.0, 693.0, 193.0, 76.0, 29.0, 14.0, 8.0, 4.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.251220703125, -19.65869140625, -19.066162109375, -18.4736328125, -17.881103515625, -17.28857421875, -16.696044921875, -16.103515625, -15.510986328125, -14.91845703125, -14.325927734375, -13.7333984375, -13.140869140625, -12.54833984375, -11.955810546875, -11.36328125, -10.770751953125, -10.17822265625, -9.585693359375, -8.9931640625, -8.400634765625, -7.80810546875, -7.215576171875, -6.623046875, -6.030517578125, -5.43798828125, -4.845458984375, -4.2529296875, -3.660400390625, -3.06787109375, -2.475341796875, -1.8828125, -1.290283203125, -0.69775390625, -0.105224609375, 0.4873046875, 1.079833984375, 1.67236328125, 2.264892578125, 2.857421875, 3.449951171875, 4.04248046875, 4.635009765625, 5.2275390625, 5.820068359375, 6.41259765625, 7.005126953125, 7.59765625, 8.190185546875, 8.78271484375, 9.375244140625, 9.9677734375, 10.560302734375, 11.15283203125, 11.745361328125, 12.337890625, 12.930419921875, 13.52294921875, 14.115478515625, 14.7080078125, 15.300537109375, 15.89306640625, 16.485595703125, 17.078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 23.0, 26.0, 80.0, 178.0, 334.0, 183.0, 71.0, 38.0, 15.0, 12.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8125, -12.418212890625, -12.02392578125, -11.629638671875, -11.2353515625, -10.841064453125, -10.44677734375, -10.052490234375, -9.658203125, -9.263916015625, -8.86962890625, -8.475341796875, -8.0810546875, -7.686767578125, -7.29248046875, -6.898193359375, -6.50390625, -6.109619140625, -5.71533203125, -5.321044921875, -4.9267578125, -4.532470703125, -4.13818359375, -3.743896484375, -3.349609375, -2.955322265625, -2.56103515625, -2.166748046875, -1.7724609375, -1.378173828125, -0.98388671875, -0.589599609375, -0.1953125, 0.198974609375, 0.59326171875, 0.987548828125, 1.3818359375, 1.776123046875, 2.17041015625, 2.564697265625, 2.958984375, 3.353271484375, 3.74755859375, 4.141845703125, 4.5361328125, 4.930419921875, 5.32470703125, 5.718994140625, 6.11328125, 6.507568359375, 6.90185546875, 7.296142578125, 7.6904296875, 8.084716796875, 8.47900390625, 8.873291015625, 9.267578125, 9.661865234375, 10.05615234375, 10.450439453125, 10.8447265625, 11.239013671875, 11.63330078125, 12.027587890625, 12.421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 12.0, 15.0, 17.0, 50.0, 87.0, 194.0, 379.0, 150.0, 50.0, 20.0, 10.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-178.47137451171875, -174.04998779296875, -169.62860107421875, -165.2071990966797, -160.7858123779297, -156.3644256591797, -151.9430389404297, -147.52163696289062, -143.10025024414062, -138.67886352539062, -134.25747680664062, -129.83607482910156, -125.41468811035156, -120.99330139160156, -116.57191467285156, -112.15052032470703, -107.72913360595703, -103.30774688720703, -98.8863525390625, -94.4649658203125, -90.04357147216797, -85.62218475341797, -81.20079040527344, -76.77940368652344, -72.35801696777344, -67.93663024902344, -63.515235900878906, -59.093849182128906, -54.672454833984375, -50.251068115234375, -45.82967758178711, -41.408287048339844, -36.98689270019531, -32.56550216674805, -28.14411163330078, -23.72272300720215, -19.301332473754883, -14.879941940307617, -10.458553314208984, -6.037162780761719, -1.6157722473144531, 2.8056178092956543, 7.227007865905762, 11.648397445678711, 16.069787979125977, 20.491178512573242, 24.912567138671875, 29.33395767211914, 33.755348205566406, 38.17673873901367, 42.59812927246094, 47.01951599121094, 51.44091033935547, 55.86229705810547, 60.283687591552734, 64.705078125, 69.12646484375, 73.5478515625, 77.96924591064453, 82.39063262939453, 86.81202697753906, 91.23341369628906, 95.65480041503906, 100.0761947631836, 104.49758911132812]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 4.0, 6.0, 9.0, 9.0, 9.0, 8.0, 23.0, 16.0, 17.0, 20.0, 22.0, 20.0, 37.0, 28.0, 32.0, 28.0, 53.0, 66.0, 99.0, 89.0, 69.0, 39.0, 31.0, 30.0, 35.0, 29.0, 20.0, 13.0, 16.0, 17.0, 9.0, 15.0, 16.0, 11.0, 7.0, 8.0, 3.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-68.72903442382812, -66.56958770751953, -64.41014862060547, -62.250701904296875, -60.09125518798828, -57.93181228637695, -55.772369384765625, -53.61292266845703, -51.4534797668457, -49.294036865234375, -47.13459014892578, -44.97514724731445, -42.815704345703125, -40.65625762939453, -38.4968147277832, -36.337371826171875, -34.17792510986328, -32.01848220825195, -29.85903549194336, -27.69959259033203, -25.54014778137207, -23.38070297241211, -21.22126007080078, -19.06181526184082, -16.90237045288086, -14.742925643920898, -12.583481788635254, -10.42403793334961, -8.264593124389648, -6.1051483154296875, -3.945704460144043, -1.7862606048583984, 0.3731842041015625, 2.5326285362243652, 4.692072868347168, 6.851517200469971, 9.010961532592773, 11.170406341552734, 13.329850196838379, 15.489294052124023, 17.648738861083984, 19.808183670043945, 21.967628479003906, 24.127071380615234, 26.286516189575195, 28.445960998535156, 30.605403900146484, 32.76484680175781, 34.924293518066406, 37.083736419677734, 39.24318313598633, 41.402626037597656, 43.56207275390625, 45.72151565551758, 47.880958557128906, 50.0404052734375, 52.19984817504883, 54.359291076660156, 56.51873779296875, 58.67818069458008, 60.837623596191406, 62.9970703125, 65.1565170288086, 67.31595611572266, 69.47540283203125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 11.0, 13.0, 15.0, 29.0, 57.0, 95.0, 195.0, 387.0, 731.0, 1691.0, 4567.0, 16015.0, 97786.0, 1041812.0, 2605531.0, 371246.0, 40148.0, 8725.0, 2922.0, 1208.0, 513.0, 255.0, 143.0, 78.0, 45.0, 27.0, 16.0, 10.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.7071533203125, -8.445556640625, -8.1839599609375, -7.92236328125, -7.6607666015625, -7.399169921875, -7.1375732421875, -6.8759765625, -6.6143798828125, -6.352783203125, -6.0911865234375, -5.82958984375, -5.5679931640625, -5.306396484375, -5.0447998046875, -4.783203125, -4.5216064453125, -4.260009765625, -3.9984130859375, -3.73681640625, -3.4752197265625, -3.213623046875, -2.9520263671875, -2.6904296875, -2.4288330078125, -2.167236328125, -1.9056396484375, -1.64404296875, -1.3824462890625, -1.120849609375, -0.8592529296875, -0.59765625, -0.3360595703125, -0.074462890625, 0.1871337890625, 0.44873046875, 0.7103271484375, 0.971923828125, 1.2335205078125, 1.4951171875, 1.7567138671875, 2.018310546875, 2.2799072265625, 2.54150390625, 2.8031005859375, 3.064697265625, 3.3262939453125, 3.587890625, 3.8494873046875, 4.111083984375, 4.3726806640625, 4.63427734375, 4.8958740234375, 5.157470703125, 5.4190673828125, 5.6806640625, 5.9422607421875, 6.203857421875, 6.4654541015625, 6.72705078125, 6.9886474609375, 7.250244140625, 7.5118408203125, 7.7734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 10.0, 12.0, 12.0, 17.0, 13.0, 21.0, 17.0, 32.0, 17.0, 24.0, 33.0, 42.0, 41.0, 32.0, 50.0, 38.0, 29.0, 43.0, 51.0, 47.0, 42.0, 46.0, 36.0, 40.0, 41.0, 33.0, 24.0, 23.0, 20.0, 15.0, 24.0, 19.0, 15.0, 4.0, 6.0, 6.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.45916748046875, -4.3050537109375, -4.15093994140625, -3.996826171875, -3.84271240234375, -3.6885986328125, -3.53448486328125, -3.38037109375, -3.22625732421875, -3.0721435546875, -2.91802978515625, -2.763916015625, -2.60980224609375, -2.4556884765625, -2.30157470703125, -2.1474609375, -1.99334716796875, -1.8392333984375, -1.68511962890625, -1.531005859375, -1.37689208984375, -1.2227783203125, -1.06866455078125, -0.91455078125, -0.76043701171875, -0.6063232421875, -0.45220947265625, -0.298095703125, -0.14398193359375, 0.0101318359375, 0.16424560546875, 0.318359375, 0.47247314453125, 0.6265869140625, 0.78070068359375, 0.934814453125, 1.08892822265625, 1.2430419921875, 1.39715576171875, 1.55126953125, 1.70538330078125, 1.8594970703125, 2.01361083984375, 2.167724609375, 2.32183837890625, 2.4759521484375, 2.63006591796875, 2.7841796875, 2.93829345703125, 3.0924072265625, 3.24652099609375, 3.400634765625, 3.55474853515625, 3.7088623046875, 3.86297607421875, 4.01708984375, 4.17120361328125, 4.3253173828125, 4.47943115234375, 4.633544921875, 4.78765869140625, 4.9417724609375, 5.09588623046875, 5.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 17.0, 62.0, 132.0, 371.0, 1944.0, 447515.0, 3739835.0, 3528.0, 541.0, 204.0, 72.0, 28.0, 18.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.9375, -38.4638671875, -36.990234375, -35.5166015625, -34.04296875, -32.5693359375, -31.095703125, -29.6220703125, -28.1484375, -26.6748046875, -25.201171875, -23.7275390625, -22.25390625, -20.7802734375, -19.306640625, -17.8330078125, -16.359375, -14.8857421875, -13.412109375, -11.9384765625, -10.46484375, -8.9912109375, -7.517578125, -6.0439453125, -4.5703125, -3.0966796875, -1.623046875, -0.1494140625, 1.32421875, 2.7978515625, 4.271484375, 5.7451171875, 7.21875, 8.6923828125, 10.166015625, 11.6396484375, 13.11328125, 14.5869140625, 16.060546875, 17.5341796875, 19.0078125, 20.4814453125, 21.955078125, 23.4287109375, 24.90234375, 26.3759765625, 27.849609375, 29.3232421875, 30.796875, 32.2705078125, 33.744140625, 35.2177734375, 36.69140625, 38.1650390625, 39.638671875, 41.1123046875, 42.5859375, 44.0595703125, 45.533203125, 47.0068359375, 48.48046875, 49.9541015625, 51.427734375, 52.9013671875, 54.375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 6.0, 12.0, 11.0, 17.0, 40.0, 80.0, 143.0, 364.0, 830.0, 1212.0, 753.0, 299.0, 149.0, 65.0, 44.0, 18.0, 17.0, 7.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.234375, -10.623779296875, -10.01318359375, -9.402587890625, -8.7919921875, -8.181396484375, -7.57080078125, -6.960205078125, -6.349609375, -5.739013671875, -5.12841796875, -4.517822265625, -3.9072265625, -3.296630859375, -2.68603515625, -2.075439453125, -1.46484375, -0.854248046875, -0.24365234375, 0.366943359375, 0.9775390625, 1.588134765625, 2.19873046875, 2.809326171875, 3.419921875, 4.030517578125, 4.64111328125, 5.251708984375, 5.8623046875, 6.472900390625, 7.08349609375, 7.694091796875, 8.3046875, 8.915283203125, 9.52587890625, 10.136474609375, 10.7470703125, 11.357666015625, 11.96826171875, 12.578857421875, 13.189453125, 13.800048828125, 14.41064453125, 15.021240234375, 15.6318359375, 16.242431640625, 16.85302734375, 17.463623046875, 18.07421875, 18.684814453125, 19.29541015625, 19.906005859375, 20.5166015625, 21.127197265625, 21.73779296875, 22.348388671875, 22.958984375, 23.569580078125, 24.18017578125, 24.790771484375, 25.4013671875, 26.011962890625, 26.62255859375, 27.233154296875, 27.84375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 11.0, 37.0, 125.0, 299.0, 326.0, 134.0, 33.0, 13.0, 8.0, 6.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-262.331298828125, -255.21958923339844, -248.1078643798828, -240.99615478515625, -233.8844451904297, -226.77273559570312, -219.6610107421875, -212.54930114746094, -205.43759155273438, -198.3258819580078, -191.2141571044922, -184.10244750976562, -176.99073791503906, -169.8790283203125, -162.76730346679688, -155.6555938720703, -148.5438690185547, -141.43215942382812, -134.3204345703125, -127.20872497558594, -120.09701538085938, -112.98529815673828, -105.87358093261719, -98.76187133789062, -91.65015411376953, -84.53843688964844, -77.42672729492188, -70.31501007080078, -63.20329666137695, -56.091583251953125, -48.97986602783203, -41.8681526184082, -34.75642395019531, -27.644710540771484, -20.532995223999023, -13.421279907226562, -6.309566497802734, 0.8021469116210938, 7.9138641357421875, 15.025577545166016, 22.137290954589844, 29.249004364013672, 36.3607177734375, 43.472434997558594, 50.58414840698242, 57.69586181640625, 64.80757904052734, 71.91929626464844, 79.031005859375, 86.1427230834961, 93.25443267822266, 100.36614990234375, 107.47785949707031, 114.5895767211914, 121.7012939453125, 128.81300354003906, 135.92471313476562, 143.0364227294922, 150.1481475830078, 157.25985717773438, 164.37156677246094, 171.4832763671875, 178.59500122070312, 185.7067108154297, 192.8184356689453]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 9.0, 12.0, 5.0, 7.0, 8.0, 6.0, 15.0, 20.0, 32.0, 21.0, 30.0, 32.0, 33.0, 38.0, 40.0, 43.0, 48.0, 46.0, 56.0, 53.0, 41.0, 48.0, 53.0, 28.0, 45.0, 30.0, 31.0, 27.0, 33.0, 27.0, 15.0, 12.0, 13.0, 11.0, 13.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-68.60537719726562, -66.64068603515625, -64.67599487304688, -62.711299896240234, -60.746604919433594, -58.78191375732422, -56.817222595214844, -54.8525276184082, -52.88783264160156, -50.92314147949219, -48.95844650268555, -46.99375534057617, -45.02906036376953, -43.064369201660156, -41.09967803955078, -39.13498306274414, -37.170291900634766, -35.20560073852539, -33.24090576171875, -31.276214599609375, -29.311519622802734, -27.34682846069336, -25.38213539123535, -23.417442321777344, -21.452749252319336, -19.488056182861328, -17.52336311340332, -15.558670997619629, -13.593977928161621, -11.629284858703613, -9.664592742919922, -7.699899673461914, -5.735206604003906, -3.7705137729644775, -1.8058209419250488, 0.15887165069580078, 2.1235647201538086, 4.088257789611816, 6.052949905395508, 8.017642974853516, 9.982336044311523, 11.947029113769531, 13.911722183227539, 15.87641429901123, 17.841106414794922, 19.805801391601562, 21.770492553710938, 23.735185623168945, 25.699878692626953, 27.66457176208496, 29.62926483154297, 31.593955993652344, 33.558650970458984, 35.52334213256836, 37.488037109375, 39.452728271484375, 41.41741943359375, 43.382110595703125, 45.346805572509766, 47.31149673461914, 49.27619171142578, 51.240882873535156, 53.20557403564453, 55.17026901245117, 57.13496398925781]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 9.0, 15.0, 12.0, 31.0, 50.0, 69.0, 100.0, 190.0, 276.0, 466.0, 914.0, 1909.0, 4264.0, 10600.0, 28629.0, 84386.0, 273120.0, 414397.0, 150997.0, 48725.0, 16838.0, 6728.0, 2861.0, 1361.0, 647.0, 355.0, 216.0, 122.0, 84.0, 50.0, 42.0, 19.0, 15.0, 12.0, 10.0, 8.0, 6.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.03125, -9.7545166015625, -9.477783203125, -9.2010498046875, -8.92431640625, -8.6475830078125, -8.370849609375, -8.0941162109375, -7.8173828125, -7.5406494140625, -7.263916015625, -6.9871826171875, -6.71044921875, -6.4337158203125, -6.156982421875, -5.8802490234375, -5.603515625, -5.3267822265625, -5.050048828125, -4.7733154296875, -4.49658203125, -4.2198486328125, -3.943115234375, -3.6663818359375, -3.3896484375, -3.1129150390625, -2.836181640625, -2.5594482421875, -2.28271484375, -2.0059814453125, -1.729248046875, -1.4525146484375, -1.17578125, -0.8990478515625, -0.622314453125, -0.3455810546875, -0.06884765625, 0.2078857421875, 0.484619140625, 0.7613525390625, 1.0380859375, 1.3148193359375, 1.591552734375, 1.8682861328125, 2.14501953125, 2.4217529296875, 2.698486328125, 2.9752197265625, 3.251953125, 3.5286865234375, 3.805419921875, 4.0821533203125, 4.35888671875, 4.6356201171875, 4.912353515625, 5.1890869140625, 5.4658203125, 5.7425537109375, 6.019287109375, 6.2960205078125, 6.57275390625, 6.8494873046875, 7.126220703125, 7.4029541015625, 7.6796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 10.0, 8.0, 6.0, 6.0, 12.0, 15.0, 18.0, 22.0, 23.0, 40.0, 33.0, 38.0, 39.0, 36.0, 41.0, 47.0, 57.0, 48.0, 41.0, 53.0, 48.0, 41.0, 44.0, 38.0, 29.0, 29.0, 22.0, 32.0, 24.0, 19.0, 17.0, 15.0, 12.0, 12.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.44384765625, -4.2744140625, -4.10498046875, -3.935546875, -3.76611328125, -3.5966796875, -3.42724609375, -3.2578125, -3.08837890625, -2.9189453125, -2.74951171875, -2.580078125, -2.41064453125, -2.2412109375, -2.07177734375, -1.90234375, -1.73291015625, -1.5634765625, -1.39404296875, -1.224609375, -1.05517578125, -0.8857421875, -0.71630859375, -0.546875, -0.37744140625, -0.2080078125, -0.03857421875, 0.130859375, 0.30029296875, 0.4697265625, 0.63916015625, 0.80859375, 0.97802734375, 1.1474609375, 1.31689453125, 1.486328125, 1.65576171875, 1.8251953125, 1.99462890625, 2.1640625, 2.33349609375, 2.5029296875, 2.67236328125, 2.841796875, 3.01123046875, 3.1806640625, 3.35009765625, 3.51953125, 3.68896484375, 3.8583984375, 4.02783203125, 4.197265625, 4.36669921875, 4.5361328125, 4.70556640625, 4.875, 5.04443359375, 5.2138671875, 5.38330078125, 5.552734375, 5.72216796875, 5.8916015625, 6.06103515625, 6.23046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 10.0, 9.0, 19.0, 16.0, 29.0, 30.0, 48.0, 76.0, 112.0, 163.0, 240.0, 379.0, 587.0, 1315.0, 2949.0, 10774.0, 89488.0, 853206.0, 73806.0, 9649.0, 2754.0, 1206.0, 659.0, 340.0, 213.0, 156.0, 98.0, 61.0, 44.0, 39.0, 16.0, 14.0, 19.0, 7.0, 6.0, 8.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.875, -23.22021484375, -22.5654296875, -21.91064453125, -21.255859375, -20.60107421875, -19.9462890625, -19.29150390625, -18.63671875, -17.98193359375, -17.3271484375, -16.67236328125, -16.017578125, -15.36279296875, -14.7080078125, -14.05322265625, -13.3984375, -12.74365234375, -12.0888671875, -11.43408203125, -10.779296875, -10.12451171875, -9.4697265625, -8.81494140625, -8.16015625, -7.50537109375, -6.8505859375, -6.19580078125, -5.541015625, -4.88623046875, -4.2314453125, -3.57666015625, -2.921875, -2.26708984375, -1.6123046875, -0.95751953125, -0.302734375, 0.35205078125, 1.0068359375, 1.66162109375, 2.31640625, 2.97119140625, 3.6259765625, 4.28076171875, 4.935546875, 5.59033203125, 6.2451171875, 6.89990234375, 7.5546875, 8.20947265625, 8.8642578125, 9.51904296875, 10.173828125, 10.82861328125, 11.4833984375, 12.13818359375, 12.79296875, 13.44775390625, 14.1025390625, 14.75732421875, 15.412109375, 16.06689453125, 16.7216796875, 17.37646484375, 18.03125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 10.0, 4.0, 4.0, 16.0, 9.0, 12.0, 15.0, 18.0, 28.0, 24.0, 42.0, 23.0, 43.0, 44.0, 48.0, 64.0, 61.0, 65.0, 65.0, 45.0, 51.0, 49.0, 33.0, 37.0, 29.0, 25.0, 31.0, 26.0, 11.0, 13.0, 11.0, 9.0, 3.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.921875, -21.26123046875, -20.6005859375, -19.93994140625, -19.279296875, -18.61865234375, -17.9580078125, -17.29736328125, -16.63671875, -15.97607421875, -15.3154296875, -14.65478515625, -13.994140625, -13.33349609375, -12.6728515625, -12.01220703125, -11.3515625, -10.69091796875, -10.0302734375, -9.36962890625, -8.708984375, -8.04833984375, -7.3876953125, -6.72705078125, -6.06640625, -5.40576171875, -4.7451171875, -4.08447265625, -3.423828125, -2.76318359375, -2.1025390625, -1.44189453125, -0.78125, -0.12060546875, 0.5400390625, 1.20068359375, 1.861328125, 2.52197265625, 3.1826171875, 3.84326171875, 4.50390625, 5.16455078125, 5.8251953125, 6.48583984375, 7.146484375, 7.80712890625, 8.4677734375, 9.12841796875, 9.7890625, 10.44970703125, 11.1103515625, 11.77099609375, 12.431640625, 13.09228515625, 13.7529296875, 14.41357421875, 15.07421875, 15.73486328125, 16.3955078125, 17.05615234375, 17.716796875, 18.37744140625, 19.0380859375, 19.69873046875, 20.359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 1.0, 7.0, 9.0, 10.0, 10.0, 38.0, 46.0, 67.0, 94.0, 200.0, 432.0, 1227.0, 5104.0, 55846.0, 950498.0, 29454.0, 3769.0, 925.0, 338.0, 188.0, 108.0, 57.0, 34.0, 24.0, 17.0, 20.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -10.4071044921875, -10.095458984375, -9.7838134765625, -9.47216796875, -9.1605224609375, -8.848876953125, -8.5372314453125, -8.2255859375, -7.9139404296875, -7.602294921875, -7.2906494140625, -6.97900390625, -6.6673583984375, -6.355712890625, -6.0440673828125, -5.732421875, -5.4207763671875, -5.109130859375, -4.7974853515625, -4.48583984375, -4.1741943359375, -3.862548828125, -3.5509033203125, -3.2392578125, -2.9276123046875, -2.615966796875, -2.3043212890625, -1.99267578125, -1.6810302734375, -1.369384765625, -1.0577392578125, -0.74609375, -0.4344482421875, -0.122802734375, 0.1888427734375, 0.50048828125, 0.8121337890625, 1.123779296875, 1.4354248046875, 1.7470703125, 2.0587158203125, 2.370361328125, 2.6820068359375, 2.99365234375, 3.3052978515625, 3.616943359375, 3.9285888671875, 4.240234375, 4.5518798828125, 4.863525390625, 5.1751708984375, 5.48681640625, 5.7984619140625, 6.110107421875, 6.4217529296875, 6.7333984375, 7.0450439453125, 7.356689453125, 7.6683349609375, 7.97998046875, 8.2916259765625, 8.603271484375, 8.9149169921875, 9.2265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 6.0, 8.0, 9.0, 13.0, 14.0, 34.0, 49.0, 77.0, 154.0, 223.0, 138.0, 68.0, 51.0, 37.0, 22.0, 15.0, 7.0, 9.0, 7.0, 4.0, 9.0, 6.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0016536712646484375, -0.0016117841005325317, -0.001569896936416626, -0.0015280097723007202, -0.0014861226081848145, -0.0014442354440689087, -0.001402348279953003, -0.0013604611158370972, -0.0013185739517211914, -0.0012766867876052856, -0.0012347996234893799, -0.0011929124593734741, -0.0011510252952575684, -0.0011091381311416626, -0.0010672509670257568, -0.001025363802909851, -0.0009834766387939453, -0.0009415894746780396, -0.0008997023105621338, -0.000857815146446228, -0.0008159279823303223, -0.0007740408182144165, -0.0007321536540985107, -0.000690266489982605, -0.0006483793258666992, -0.0006064921617507935, -0.0005646049976348877, -0.0005227178335189819, -0.00048083066940307617, -0.0004389435052871704, -0.00039705634117126465, -0.0003551691770553589, -0.0003132820129394531, -0.00027139484882354736, -0.0002295076847076416, -0.00018762052059173584, -0.00014573335647583008, -0.00010384619235992432, -6.195902824401855e-05, -2.0071864128112793e-05, 2.181529998779297e-05, 6.370246410369873e-05, 0.00010558962821960449, 0.00014747679233551025, 0.00018936395645141602, 0.00023125112056732178, 0.00027313828468322754, 0.0003150254487991333, 0.00035691261291503906, 0.0003987997770309448, 0.0004406869411468506, 0.00048257410526275635, 0.0005244612693786621, 0.0005663484334945679, 0.0006082355976104736, 0.0006501227617263794, 0.0006920099258422852, 0.0007338970899581909, 0.0007757842540740967, 0.0008176714181900024, 0.0008595585823059082, 0.000901445746421814, 0.0009433329105377197, 0.0009852200746536255, 0.0010271072387695312]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 12.0, 9.0, 26.0, 28.0, 47.0, 95.0, 267.0, 609.0, 2214.0, 18985.0, 933759.0, 85650.0, 5180.0, 992.0, 360.0, 140.0, 77.0, 42.0, 28.0, 12.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.58056640625, -12.2470703125, -11.91357421875, -11.580078125, -11.24658203125, -10.9130859375, -10.57958984375, -10.24609375, -9.91259765625, -9.5791015625, -9.24560546875, -8.912109375, -8.57861328125, -8.2451171875, -7.91162109375, -7.578125, -7.24462890625, -6.9111328125, -6.57763671875, -6.244140625, -5.91064453125, -5.5771484375, -5.24365234375, -4.91015625, -4.57666015625, -4.2431640625, -3.90966796875, -3.576171875, -3.24267578125, -2.9091796875, -2.57568359375, -2.2421875, -1.90869140625, -1.5751953125, -1.24169921875, -0.908203125, -0.57470703125, -0.2412109375, 0.09228515625, 0.42578125, 0.75927734375, 1.0927734375, 1.42626953125, 1.759765625, 2.09326171875, 2.4267578125, 2.76025390625, 3.09375, 3.42724609375, 3.7607421875, 4.09423828125, 4.427734375, 4.76123046875, 5.0947265625, 5.42822265625, 5.76171875, 6.09521484375, 6.4287109375, 6.76220703125, 7.095703125, 7.42919921875, 7.7626953125, 8.09619140625, 8.4296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 8.0, 3.0, 3.0, 5.0, 4.0, 5.0, 14.0, 12.0, 17.0, 26.0, 34.0, 49.0, 60.0, 90.0, 118.0, 151.0, 94.0, 78.0, 53.0, 33.0, 38.0, 29.0, 17.0, 14.0, 11.0, 13.0, 4.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.6251220703125, -5.461181640625, -5.2972412109375, -5.13330078125, -4.9693603515625, -4.805419921875, -4.6414794921875, -4.4775390625, -4.3135986328125, -4.149658203125, -3.9857177734375, -3.82177734375, -3.6578369140625, -3.493896484375, -3.3299560546875, -3.166015625, -3.0020751953125, -2.838134765625, -2.6741943359375, -2.51025390625, -2.3463134765625, -2.182373046875, -2.0184326171875, -1.8544921875, -1.6905517578125, -1.526611328125, -1.3626708984375, -1.19873046875, -1.0347900390625, -0.870849609375, -0.7069091796875, -0.54296875, -0.3790283203125, -0.215087890625, -0.0511474609375, 0.11279296875, 0.2767333984375, 0.440673828125, 0.6046142578125, 0.7685546875, 0.9324951171875, 1.096435546875, 1.2603759765625, 1.42431640625, 1.5882568359375, 1.752197265625, 1.9161376953125, 2.080078125, 2.2440185546875, 2.407958984375, 2.5718994140625, 2.73583984375, 2.8997802734375, 3.063720703125, 3.2276611328125, 3.3916015625, 3.5555419921875, 3.719482421875, 3.8834228515625, 4.04736328125, 4.2113037109375, 4.375244140625, 4.5391845703125, 4.703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 60.0, 656.0, 238.0, 32.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-693.8194580078125, -679.603271484375, -665.3870849609375, -651.1708984375, -636.9547119140625, -622.738525390625, -608.5223388671875, -594.30615234375, -580.0899658203125, -565.873779296875, -551.6575927734375, -537.44140625, -523.2252197265625, -509.009033203125, -494.7928466796875, -480.57666015625, -466.3605041503906, -452.1443176269531, -437.9281311035156, -423.7119445800781, -409.4957580566406, -395.2795715332031, -381.06341552734375, -366.84722900390625, -352.63104248046875, -338.41485595703125, -324.19866943359375, -309.98248291015625, -295.76629638671875, -281.55010986328125, -267.33392333984375, -253.1177520751953, -238.90151977539062, -224.68533325195312, -210.46914672851562, -196.25296020507812, -182.03677368164062, -167.82058715820312, -153.6044158935547, -139.3882293701172, -125.17204284667969, -110.95585632324219, -96.73966979980469, -82.52349090576172, -68.30730438232422, -54.09111785888672, -39.87493896484375, -25.65875244140625, -11.44256591796875, 2.773618698120117, 16.989803314208984, 31.20598602294922, 45.42217254638672, 59.63835906982422, 73.85453796386719, 88.07072448730469, 102.28691101074219, 116.50309753417969, 130.7192840576172, 144.93545532226562, 159.15164184570312, 173.36782836914062, 187.58401489257812, 201.80020141601562, 216.01638793945312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 4.0, 6.0, 18.0, 14.0, 19.0, 25.0, 30.0, 31.0, 34.0, 28.0, 34.0, 50.0, 124.0, 170.0, 70.0, 39.0, 49.0, 37.0, 26.0, 24.0, 26.0, 28.0, 13.0, 15.0, 17.0, 7.0, 10.0, 8.0, 5.0, 1.0, 7.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.43122863769531, -98.28334045410156, -95.13545989990234, -91.9875717163086, -88.83969116210938, -85.69180297851562, -82.54391479492188, -79.39603424072266, -76.24815368652344, -73.10026550292969, -69.95238494873047, -66.80449676513672, -63.6566162109375, -60.50872802734375, -57.360843658447266, -54.21295928955078, -51.06507110595703, -47.91718673706055, -44.76930236816406, -41.62141418457031, -38.473533630371094, -35.325645446777344, -32.17776107788086, -29.029876708984375, -25.88199234008789, -22.734107971191406, -19.586223602294922, -16.438337326049805, -13.29045295715332, -10.142568588256836, -6.994682312011719, -3.8467979431152344, -0.69891357421875, 2.4489712715148926, 5.596856117248535, 8.744741439819336, 11.89262580871582, 15.040510177612305, 18.188396453857422, 21.336280822753906, 24.48416519165039, 27.632049560546875, 30.77993392944336, 33.927818298339844, 37.075706481933594, 40.22358703613281, 43.37147521972656, 46.51935958862305, 49.66724395751953, 52.815128326416016, 55.9630126953125, 59.11090087890625, 62.25878143310547, 65.40666961669922, 68.55455017089844, 71.70243835449219, 74.85032653808594, 77.99821472167969, 81.1460952758789, 84.29398345947266, 87.44186401367188, 90.58975219726562, 93.73764038085938, 96.8855209350586, 100.03340148925781]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 8.0, 12.0, 12.0, 15.0, 28.0, 52.0, 85.0, 123.0, 203.0, 333.0, 569.0, 1087.0, 2200.0, 5725.0, 21654.0, 209384.0, 2352085.0, 1475914.0, 102566.0, 14152.0, 4260.0, 1719.0, 863.0, 480.0, 301.0, 165.0, 94.0, 74.0, 41.0, 34.0, 15.0, 8.0, 9.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.6641845703125, -11.273681640625, -10.8831787109375, -10.49267578125, -10.1021728515625, -9.711669921875, -9.3211669921875, -8.9306640625, -8.5401611328125, -8.149658203125, -7.7591552734375, -7.36865234375, -6.9781494140625, -6.587646484375, -6.1971435546875, -5.806640625, -5.4161376953125, -5.025634765625, -4.6351318359375, -4.24462890625, -3.8541259765625, -3.463623046875, -3.0731201171875, -2.6826171875, -2.2921142578125, -1.901611328125, -1.5111083984375, -1.12060546875, -0.7301025390625, -0.339599609375, 0.0509033203125, 0.44140625, 0.8319091796875, 1.222412109375, 1.6129150390625, 2.00341796875, 2.3939208984375, 2.784423828125, 3.1749267578125, 3.5654296875, 3.9559326171875, 4.346435546875, 4.7369384765625, 5.12744140625, 5.5179443359375, 5.908447265625, 6.2989501953125, 6.689453125, 7.0799560546875, 7.470458984375, 7.8609619140625, 8.25146484375, 8.6419677734375, 9.032470703125, 9.4229736328125, 9.8134765625, 10.2039794921875, 10.594482421875, 10.9849853515625, 11.37548828125, 11.7659912109375, 12.156494140625, 12.5469970703125, 12.9375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 10.0, 9.0, 5.0, 9.0, 13.0, 13.0, 12.0, 24.0, 22.0, 29.0, 27.0, 26.0, 26.0, 33.0, 37.0, 34.0, 42.0, 47.0, 47.0, 41.0, 50.0, 50.0, 37.0, 40.0, 34.0, 33.0, 35.0, 26.0, 32.0, 26.0, 19.0, 22.0, 23.0, 11.0, 16.0, 6.0, 9.0, 3.0, 3.0, 4.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.15789794921875, -4.0072021484375, -3.85650634765625, -3.705810546875, -3.55511474609375, -3.4044189453125, -3.25372314453125, -3.10302734375, -2.95233154296875, -2.8016357421875, -2.65093994140625, -2.500244140625, -2.34954833984375, -2.1988525390625, -2.04815673828125, -1.8974609375, -1.74676513671875, -1.5960693359375, -1.44537353515625, -1.294677734375, -1.14398193359375, -0.9932861328125, -0.84259033203125, -0.69189453125, -0.54119873046875, -0.3905029296875, -0.23980712890625, -0.089111328125, 0.06158447265625, 0.2122802734375, 0.36297607421875, 0.513671875, 0.66436767578125, 0.8150634765625, 0.96575927734375, 1.116455078125, 1.26715087890625, 1.4178466796875, 1.56854248046875, 1.71923828125, 1.86993408203125, 2.0206298828125, 2.17132568359375, 2.322021484375, 2.47271728515625, 2.6234130859375, 2.77410888671875, 2.9248046875, 3.07550048828125, 3.2261962890625, 3.37689208984375, 3.527587890625, 3.67828369140625, 3.8289794921875, 3.97967529296875, 4.13037109375, 4.28106689453125, 4.4317626953125, 4.58245849609375, 4.733154296875, 4.88385009765625, 5.0345458984375, 5.18524169921875, 5.3359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 9.0, 14.0, 30.0, 65.0, 103.0, 207.0, 412.0, 1010.0, 3957.0, 362168.0, 3817162.0, 6768.0, 1358.0, 473.0, 255.0, 125.0, 62.0, 35.0, 24.0, 12.0, 11.0, 10.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.53125, -49.76123046875, -47.9912109375, -46.22119140625, -44.451171875, -42.68115234375, -40.9111328125, -39.14111328125, -37.37109375, -35.60107421875, -33.8310546875, -32.06103515625, -30.291015625, -28.52099609375, -26.7509765625, -24.98095703125, -23.2109375, -21.44091796875, -19.6708984375, -17.90087890625, -16.130859375, -14.36083984375, -12.5908203125, -10.82080078125, -9.05078125, -7.28076171875, -5.5107421875, -3.74072265625, -1.970703125, -0.20068359375, 1.5693359375, 3.33935546875, 5.109375, 6.87939453125, 8.6494140625, 10.41943359375, 12.189453125, 13.95947265625, 15.7294921875, 17.49951171875, 19.26953125, 21.03955078125, 22.8095703125, 24.57958984375, 26.349609375, 28.11962890625, 29.8896484375, 31.65966796875, 33.4296875, 35.19970703125, 36.9697265625, 38.73974609375, 40.509765625, 42.27978515625, 44.0498046875, 45.81982421875, 47.58984375, 49.35986328125, 51.1298828125, 52.89990234375, 54.669921875, 56.43994140625, 58.2099609375, 59.97998046875, 61.75]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 10.0, 14.0, 13.0, 24.0, 28.0, 63.0, 92.0, 102.0, 204.0, 347.0, 575.0, 703.0, 676.0, 427.0, 248.0, 162.0, 100.0, 78.0, 47.0, 43.0, 28.0, 20.0, 19.0, 10.0, 11.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.46875, -12.901611328125, -12.33447265625, -11.767333984375, -11.2001953125, -10.633056640625, -10.06591796875, -9.498779296875, -8.931640625, -8.364501953125, -7.79736328125, -7.230224609375, -6.6630859375, -6.095947265625, -5.52880859375, -4.961669921875, -4.39453125, -3.827392578125, -3.26025390625, -2.693115234375, -2.1259765625, -1.558837890625, -0.99169921875, -0.424560546875, 0.142578125, 0.709716796875, 1.27685546875, 1.843994140625, 2.4111328125, 2.978271484375, 3.54541015625, 4.112548828125, 4.6796875, 5.246826171875, 5.81396484375, 6.381103515625, 6.9482421875, 7.515380859375, 8.08251953125, 8.649658203125, 9.216796875, 9.783935546875, 10.35107421875, 10.918212890625, 11.4853515625, 12.052490234375, 12.61962890625, 13.186767578125, 13.75390625, 14.321044921875, 14.88818359375, 15.455322265625, 16.0224609375, 16.589599609375, 17.15673828125, 17.723876953125, 18.291015625, 18.858154296875, 19.42529296875, 19.992431640625, 20.5595703125, 21.126708984375, 21.69384765625, 22.260986328125, 22.828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 10.0, 9.0, 11.0, 12.0, 22.0, 56.0, 128.0, 202.0, 231.0, 150.0, 67.0, 38.0, 16.0, 12.0, 9.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.5052947998047, -159.9416961669922, -152.3780975341797, -144.81448364257812, -137.25088500976562, -129.68728637695312, -122.12368774414062, -114.56008911132812, -106.9964828491211, -99.4328842163086, -91.86927795410156, -84.30567932128906, -76.74208068847656, -69.17847442626953, -61.61487579345703, -54.051273345947266, -46.4876708984375, -38.924068450927734, -31.3604679107666, -23.79686737060547, -16.233264923095703, -8.669662475585938, -1.1060638427734375, 6.457538604736328, 14.021141052246094, 21.58474349975586, 29.148344039916992, 36.711944580078125, 44.27554702758789, 51.839149475097656, 59.402748107910156, 66.96635437011719, 74.52996826171875, 82.09356689453125, 89.65717315673828, 97.22077178955078, 104.78437805175781, 112.34797668457031, 119.91157531738281, 127.47517395019531, 135.03878784179688, 142.60238647460938, 150.16598510742188, 157.72958374023438, 165.29319763183594, 172.85679626464844, 180.42039489746094, 187.98399353027344, 195.54759216308594, 203.11119079589844, 210.67478942871094, 218.2384033203125, 225.802001953125, 233.3656005859375, 240.92919921875, 248.4927978515625, 256.056396484375, 263.6199951171875, 271.18359375, 278.7471923828125, 286.310791015625, 293.8743896484375, 301.43798828125, 309.0016174316406, 316.5652160644531]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 6.0, 9.0, 7.0, 16.0, 25.0, 17.0, 32.0, 31.0, 48.0, 60.0, 53.0, 67.0, 55.0, 77.0, 91.0, 74.0, 56.0, 53.0, 41.0, 40.0, 29.0, 28.0, 14.0, 18.0, 8.0, 10.0, 3.0, 7.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.36074829101562, -152.4566650390625, -148.55259704589844, -144.6485137939453, -140.74444580078125, -136.84036254882812, -132.93629455566406, -129.03221130371094, -125.12814331054688, -121.22406768798828, -117.31999206542969, -113.4159164428711, -109.5118408203125, -105.6077651977539, -101.70368957519531, -97.79960632324219, -93.8955307006836, -89.991455078125, -86.0873794555664, -82.18330383300781, -78.27922821044922, -74.37515258789062, -70.4710693359375, -66.56700134277344, -62.66292190551758, -58.758846282958984, -54.85477066040039, -50.95069122314453, -47.04661560058594, -43.142539978027344, -39.23846435546875, -35.334388732910156, -31.430320739746094, -27.5262451171875, -23.622169494628906, -19.71809196472168, -15.814016342163086, -11.909940719604492, -8.005863189697266, -4.101787567138672, -0.19771194458007812, 3.706364154815674, 7.610440254211426, 11.514516830444336, 15.41859245300293, 19.322668075561523, 23.22674560546875, 27.130821228027344, 31.034896850585938, 34.93897247314453, 38.843048095703125, 42.74712371826172, 46.65119934082031, 50.555274963378906, 54.459354400634766, 58.36343002319336, 62.26750564575195, 66.17158508300781, 70.0756607055664, 73.979736328125, 77.8838119506836, 81.78788757324219, 85.69196319580078, 89.59603881835938, 93.50011444091797]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 11.0, 13.0, 13.0, 22.0, 23.0, 54.0, 73.0, 116.0, 196.0, 347.0, 597.0, 1044.0, 2052.0, 4157.0, 9037.0, 23016.0, 67207.0, 248956.0, 492519.0, 131845.0, 39780.0, 14690.0, 6219.0, 2954.0, 1525.0, 830.0, 501.0, 262.0, 175.0, 106.0, 79.0, 40.0, 33.0, 21.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.2578125, -9.0025634765625, -8.747314453125, -8.4920654296875, -8.23681640625, -7.9815673828125, -7.726318359375, -7.4710693359375, -7.2158203125, -6.9605712890625, -6.705322265625, -6.4500732421875, -6.19482421875, -5.9395751953125, -5.684326171875, -5.4290771484375, -5.173828125, -4.9185791015625, -4.663330078125, -4.4080810546875, -4.15283203125, -3.8975830078125, -3.642333984375, -3.3870849609375, -3.1318359375, -2.8765869140625, -2.621337890625, -2.3660888671875, -2.11083984375, -1.8555908203125, -1.600341796875, -1.3450927734375, -1.08984375, -0.8345947265625, -0.579345703125, -0.3240966796875, -0.06884765625, 0.1864013671875, 0.441650390625, 0.6968994140625, 0.9521484375, 1.2073974609375, 1.462646484375, 1.7178955078125, 1.97314453125, 2.2283935546875, 2.483642578125, 2.7388916015625, 2.994140625, 3.2493896484375, 3.504638671875, 3.7598876953125, 4.01513671875, 4.2703857421875, 4.525634765625, 4.7808837890625, 5.0361328125, 5.2913818359375, 5.546630859375, 5.8018798828125, 6.05712890625, 6.3123779296875, 6.567626953125, 6.8228759765625, 7.078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 8.0, 16.0, 24.0, 19.0, 27.0, 31.0, 48.0, 38.0, 37.0, 52.0, 56.0, 65.0, 69.0, 58.0, 51.0, 56.0, 50.0, 60.0, 42.0, 32.0, 36.0, 24.0, 20.0, 12.0, 17.0, 12.0, 11.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-10.1015625, -9.86602783203125, -9.6304931640625, -9.39495849609375, -9.159423828125, -8.92388916015625, -8.6883544921875, -8.45281982421875, -8.21728515625, -7.98175048828125, -7.7462158203125, -7.51068115234375, -7.275146484375, -7.03961181640625, -6.8040771484375, -6.56854248046875, -6.3330078125, -6.09747314453125, -5.8619384765625, -5.62640380859375, -5.390869140625, -5.15533447265625, -4.9197998046875, -4.68426513671875, -4.44873046875, -4.21319580078125, -3.9776611328125, -3.74212646484375, -3.506591796875, -3.27105712890625, -3.0355224609375, -2.79998779296875, -2.564453125, -2.32891845703125, -2.0933837890625, -1.85784912109375, -1.622314453125, -1.38677978515625, -1.1512451171875, -0.91571044921875, -0.68017578125, -0.44464111328125, -0.2091064453125, 0.02642822265625, 0.261962890625, 0.49749755859375, 0.7330322265625, 0.96856689453125, 1.2041015625, 1.43963623046875, 1.6751708984375, 1.91070556640625, 2.146240234375, 2.38177490234375, 2.6173095703125, 2.85284423828125, 3.08837890625, 3.32391357421875, 3.5594482421875, 3.79498291015625, 4.030517578125, 4.26605224609375, 4.5015869140625, 4.73712158203125, 4.97265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 8.0, 6.0, 3.0, 6.0, 11.0, 17.0, 18.0, 22.0, 25.0, 50.0, 60.0, 87.0, 142.0, 209.0, 325.0, 596.0, 1232.0, 3456.0, 16900.0, 309702.0, 683680.0, 24310.0, 4491.0, 1480.0, 686.0, 325.0, 209.0, 162.0, 91.0, 63.0, 45.0, 39.0, 27.0, 20.0, 9.0, 8.0, 7.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-15.59375, -15.16162109375, -14.7294921875, -14.29736328125, -13.865234375, -13.43310546875, -13.0009765625, -12.56884765625, -12.13671875, -11.70458984375, -11.2724609375, -10.84033203125, -10.408203125, -9.97607421875, -9.5439453125, -9.11181640625, -8.6796875, -8.24755859375, -7.8154296875, -7.38330078125, -6.951171875, -6.51904296875, -6.0869140625, -5.65478515625, -5.22265625, -4.79052734375, -4.3583984375, -3.92626953125, -3.494140625, -3.06201171875, -2.6298828125, -2.19775390625, -1.765625, -1.33349609375, -0.9013671875, -0.46923828125, -0.037109375, 0.39501953125, 0.8271484375, 1.25927734375, 1.69140625, 2.12353515625, 2.5556640625, 2.98779296875, 3.419921875, 3.85205078125, 4.2841796875, 4.71630859375, 5.1484375, 5.58056640625, 6.0126953125, 6.44482421875, 6.876953125, 7.30908203125, 7.7412109375, 8.17333984375, 8.60546875, 9.03759765625, 9.4697265625, 9.90185546875, 10.333984375, 10.76611328125, 11.1982421875, 11.63037109375, 12.0625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 6.0, 6.0, 13.0, 8.0, 8.0, 9.0, 22.0, 18.0, 15.0, 26.0, 26.0, 33.0, 44.0, 49.0, 69.0, 74.0, 95.0, 91.0, 69.0, 50.0, 43.0, 48.0, 30.0, 27.0, 15.0, 19.0, 19.0, 12.0, 12.0, 8.0, 11.0, 6.0, 5.0, 0.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.375, -27.554931640625, -26.73486328125, -25.914794921875, -25.0947265625, -24.274658203125, -23.45458984375, -22.634521484375, -21.814453125, -20.994384765625, -20.17431640625, -19.354248046875, -18.5341796875, -17.714111328125, -16.89404296875, -16.073974609375, -15.25390625, -14.433837890625, -13.61376953125, -12.793701171875, -11.9736328125, -11.153564453125, -10.33349609375, -9.513427734375, -8.693359375, -7.873291015625, -7.05322265625, -6.233154296875, -5.4130859375, -4.593017578125, -3.77294921875, -2.952880859375, -2.1328125, -1.312744140625, -0.49267578125, 0.327392578125, 1.1474609375, 1.967529296875, 2.78759765625, 3.607666015625, 4.427734375, 5.247802734375, 6.06787109375, 6.887939453125, 7.7080078125, 8.528076171875, 9.34814453125, 10.168212890625, 10.98828125, 11.808349609375, 12.62841796875, 13.448486328125, 14.2685546875, 15.088623046875, 15.90869140625, 16.728759765625, 17.548828125, 18.368896484375, 19.18896484375, 20.009033203125, 20.8291015625, 21.649169921875, 22.46923828125, 23.289306640625, 24.109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 12.0, 7.0, 11.0, 10.0, 15.0, 16.0, 21.0, 31.0, 36.0, 40.0, 89.0, 110.0, 187.0, 286.0, 432.0, 842.0, 1576.0, 3432.0, 8656.0, 28058.0, 236348.0, 716511.0, 34043.0, 9933.0, 3765.0, 1798.0, 858.0, 498.0, 275.0, 174.0, 133.0, 95.0, 40.0, 40.0, 38.0, 23.0, 24.0, 19.0, 9.0, 12.0, 9.0, 10.0, 7.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0], "bins": [-1.65234375, -1.6023712158203125, -1.552398681640625, -1.5024261474609375, -1.45245361328125, -1.4024810791015625, -1.352508544921875, -1.3025360107421875, -1.2525634765625, -1.2025909423828125, -1.152618408203125, -1.1026458740234375, -1.05267333984375, -1.0027008056640625, -0.952728271484375, -0.9027557373046875, -0.852783203125, -0.8028106689453125, -0.752838134765625, -0.7028656005859375, -0.65289306640625, -0.6029205322265625, -0.552947998046875, -0.5029754638671875, -0.4530029296875, -0.4030303955078125, -0.353057861328125, -0.3030853271484375, -0.25311279296875, -0.2031402587890625, -0.153167724609375, -0.1031951904296875, -0.05322265625, -0.0032501220703125, 0.046722412109375, 0.0966949462890625, 0.14666748046875, 0.1966400146484375, 0.246612548828125, 0.2965850830078125, 0.3465576171875, 0.3965301513671875, 0.446502685546875, 0.4964752197265625, 0.54644775390625, 0.5964202880859375, 0.646392822265625, 0.6963653564453125, 0.746337890625, 0.7963104248046875, 0.846282958984375, 0.8962554931640625, 0.94622802734375, 0.9962005615234375, 1.046173095703125, 1.0961456298828125, 1.1461181640625, 1.1960906982421875, 1.246063232421875, 1.2960357666015625, 1.34600830078125, 1.3959808349609375, 1.445953369140625, 1.4959259033203125, 1.5458984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 10.0, 12.0, 29.0, 28.0, 37.0, 62.0, 110.0, 192.0, 192.0, 119.0, 59.0, 34.0, 21.0, 18.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008893013000488281, -0.0008623376488685608, -0.0008353739976882935, -0.0008084103465080261, -0.0007814466953277588, -0.0007544830441474915, -0.0007275193929672241, -0.0007005557417869568, -0.0006735920906066895, -0.0006466284394264221, -0.0006196647882461548, -0.0005927011370658875, -0.0005657374858856201, -0.0005387738347053528, -0.0005118101835250854, -0.0004848465323448181, -0.0004578828811645508, -0.00043091922998428345, -0.0004039555788040161, -0.0003769919276237488, -0.00035002827644348145, -0.0003230646252632141, -0.0002961009740829468, -0.00026913732290267944, -0.0002421736717224121, -0.00021521002054214478, -0.00018824636936187744, -0.0001612827181816101, -0.00013431906700134277, -0.00010735541582107544, -8.03917646408081e-05, -5.342811346054077e-05, -2.6464462280273438e-05, 4.991888999938965e-07, 2.746284008026123e-05, 5.4426491260528564e-05, 8.13901424407959e-05, 0.00010835379362106323, 0.00013531744480133057, 0.0001622810959815979, 0.00018924474716186523, 0.00021620839834213257, 0.0002431720495223999, 0.00027013570070266724, 0.00029709935188293457, 0.0003240630030632019, 0.00035102665424346924, 0.00037799030542373657, 0.0004049539566040039, 0.00043191760778427124, 0.0004588812589645386, 0.0004858449101448059, 0.0005128085613250732, 0.0005397722125053406, 0.0005667358636856079, 0.0005936995148658752, 0.0006206631660461426, 0.0006476268172264099, 0.0006745904684066772, 0.0007015541195869446, 0.0007285177707672119, 0.0007554814219474792, 0.0007824450731277466, 0.0008094087243080139, 0.0008363723754882812]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 12.0, 12.0, 18.0, 34.0, 55.0, 84.0, 127.0, 214.0, 419.0, 809.0, 1682.0, 3844.0, 10577.0, 35167.0, 507871.0, 435746.0, 34371.0, 10183.0, 3868.0, 1687.0, 782.0, 401.0, 229.0, 132.0, 67.0, 53.0, 34.0, 16.0, 14.0, 8.0, 10.0, 7.0, 6.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.787109375, -1.7294464111328125, -1.671783447265625, -1.6141204833984375, -1.55645751953125, -1.4987945556640625, -1.441131591796875, -1.3834686279296875, -1.3258056640625, -1.2681427001953125, -1.210479736328125, -1.1528167724609375, -1.09515380859375, -1.0374908447265625, -0.979827880859375, -0.9221649169921875, -0.864501953125, -0.8068389892578125, -0.749176025390625, -0.6915130615234375, -0.63385009765625, -0.5761871337890625, -0.518524169921875, -0.4608612060546875, -0.4031982421875, -0.3455352783203125, -0.287872314453125, -0.2302093505859375, -0.17254638671875, -0.1148834228515625, -0.057220458984375, 0.0004425048828125, 0.05810546875, 0.1157684326171875, 0.173431396484375, 0.2310943603515625, 0.28875732421875, 0.3464202880859375, 0.404083251953125, 0.4617462158203125, 0.5194091796875, 0.5770721435546875, 0.634735107421875, 0.6923980712890625, 0.75006103515625, 0.8077239990234375, 0.865386962890625, 0.9230499267578125, 0.980712890625, 1.0383758544921875, 1.096038818359375, 1.1537017822265625, 1.21136474609375, 1.2690277099609375, 1.326690673828125, 1.3843536376953125, 1.4420166015625, 1.4996795654296875, 1.557342529296875, 1.6150054931640625, 1.67266845703125, 1.7303314208984375, 1.787994384765625, 1.8456573486328125, 1.9033203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 10.0, 5.0, 3.0, 12.0, 5.0, 6.0, 19.0, 22.0, 17.0, 37.0, 45.0, 64.0, 107.0, 106.0, 119.0, 113.0, 81.0, 58.0, 34.0, 28.0, 17.0, 18.0, 21.0, 12.0, 8.0, 6.0, 7.0, 2.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.107421875, -2.0442047119140625, -1.980987548828125, -1.9177703857421875, -1.85455322265625, -1.7913360595703125, -1.728118896484375, -1.6649017333984375, -1.6016845703125, -1.5384674072265625, -1.475250244140625, -1.4120330810546875, -1.34881591796875, -1.2855987548828125, -1.222381591796875, -1.1591644287109375, -1.095947265625, -1.0327301025390625, -0.969512939453125, -0.9062957763671875, -0.84307861328125, -0.7798614501953125, -0.716644287109375, -0.6534271240234375, -0.5902099609375, -0.5269927978515625, -0.463775634765625, -0.4005584716796875, -0.33734130859375, -0.2741241455078125, -0.210906982421875, -0.1476898193359375, -0.08447265625, -0.0212554931640625, 0.041961669921875, 0.1051788330078125, 0.16839599609375, 0.2316131591796875, 0.294830322265625, 0.3580474853515625, 0.4212646484375, 0.4844818115234375, 0.547698974609375, 0.6109161376953125, 0.67413330078125, 0.7373504638671875, 0.800567626953125, 0.8637847900390625, 0.927001953125, 0.9902191162109375, 1.053436279296875, 1.1166534423828125, 1.17987060546875, 1.2430877685546875, 1.306304931640625, 1.3695220947265625, 1.4327392578125, 1.4959564208984375, 1.559173583984375, 1.6223907470703125, 1.68560791015625, 1.7488250732421875, 1.812042236328125, 1.8752593994140625, 1.9384765625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 11.0, 19.0, 37.0, 70.0, 160.0, 493.0, 98.0, 41.0, 32.0, 18.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-153.13253784179688, -149.51748657226562, -145.90245056152344, -142.2873992919922, -138.67236328125, -135.05731201171875, -131.4422607421875, -127.82722473144531, -124.21217346191406, -120.59712982177734, -116.98208618164062, -113.36703491210938, -109.75199127197266, -106.13694763183594, -102.52190399169922, -98.9068603515625, -95.29181671142578, -91.67677307128906, -88.06172943115234, -84.44668579101562, -80.83163452148438, -77.21659088134766, -73.60154724121094, -69.98650360107422, -66.3714599609375, -62.75641632080078, -59.1413688659668, -55.52632522583008, -51.911277770996094, -48.296234130859375, -44.681190490722656, -41.06614685058594, -37.45109558105469, -33.83605194091797, -30.221004486083984, -26.605960845947266, -22.990915298461914, -19.375869750976562, -15.760826110839844, -12.145780563354492, -8.53073501586914, -4.915689945220947, -1.300644874572754, 2.3143997192382812, 5.929445266723633, 9.544490814208984, 13.159534454345703, 16.774580001831055, 20.389625549316406, 24.004671096801758, 27.61971664428711, 31.234760284423828, 34.84980773925781, 38.46485137939453, 42.07989501953125, 45.69493865966797, 49.30998611450195, 52.92502975463867, 56.540077209472656, 60.155120849609375, 63.770164489746094, 67.38520812988281, 71.00025939941406, 74.61530303955078, 78.2303466796875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 7.0, 8.0, 5.0, 7.0, 9.0, 8.0, 10.0, 15.0, 20.0, 19.0, 15.0, 17.0, 24.0, 18.0, 39.0, 102.0, 137.0, 152.0, 124.0, 42.0, 26.0, 22.0, 24.0, 17.0, 24.0, 13.0, 14.0, 10.0, 8.0, 14.0, 8.0, 7.0, 6.0, 3.0, 7.0, 2.0, 7.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-70.59358215332031, -68.57595825195312, -66.55833435058594, -64.54070281982422, -62.52307891845703, -60.505455017089844, -58.48782730102539, -56.47019958496094, -54.45257568359375, -52.43495178222656, -50.41732406616211, -48.399696350097656, -46.38207244873047, -44.36444854736328, -42.34682083129883, -40.329193115234375, -38.31156921386719, -36.2939453125, -34.27631759643555, -32.258689880371094, -30.241065979003906, -28.223440170288086, -26.205814361572266, -24.188188552856445, -22.170562744140625, -20.152936935424805, -18.135311126708984, -16.117685317993164, -14.100059509277344, -12.082433700561523, -10.064807891845703, -8.047182083129883, -6.029563903808594, -4.011938095092773, -1.9943122863769531, 0.023313522338867188, 2.0409393310546875, 4.058565139770508, 6.076190948486328, 8.093816757202148, 10.111442565917969, 12.129068374633789, 14.14669418334961, 16.16431999206543, 18.18194580078125, 20.19957160949707, 22.21719741821289, 24.23482322692871, 26.25244903564453, 28.27007484436035, 30.287700653076172, 32.305328369140625, 34.32295227050781, 36.340576171875, 38.35820388793945, 40.375831604003906, 42.393455505371094, 44.41107940673828, 46.428707122802734, 48.44633483886719, 50.463958740234375, 52.48158264160156, 54.499210357666016, 56.51683807373047, 58.534461975097656]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 15.0, 16.0, 23.0, 30.0, 38.0, 53.0, 63.0, 180.0, 282.0, 62.0, 50.0, 49.0, 31.0, 35.0, 13.0, 17.0, 7.0, 3.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.890625, -14.5601806640625, -14.229736328125, -13.8992919921875, -13.56884765625, -13.2384033203125, -12.907958984375, -12.5775146484375, -12.2470703125, -11.9166259765625, -11.586181640625, -11.2557373046875, -10.92529296875, -10.5948486328125, -10.264404296875, -9.9339599609375, -9.603515625, -9.2730712890625, -8.942626953125, -8.6121826171875, -8.28173828125, -7.9512939453125, -7.620849609375, -7.2904052734375, -6.9599609375, -6.6295166015625, -6.299072265625, -5.9686279296875, -5.63818359375, -5.3077392578125, -4.977294921875, -4.6468505859375, -4.31640625, -3.9859619140625, -3.655517578125, -3.3250732421875, -2.99462890625, -2.6641845703125, -2.333740234375, -2.0032958984375, -1.6728515625, -1.3424072265625, -1.011962890625, -0.6815185546875, -0.35107421875, -0.0206298828125, 0.309814453125, 0.6402587890625, 0.970703125, 1.3011474609375, 1.631591796875, 1.9620361328125, 2.29248046875, 2.6229248046875, 2.953369140625, 3.2838134765625, 3.6142578125, 3.9447021484375, 4.275146484375, 4.6055908203125, 4.93603515625, 5.2664794921875, 5.596923828125, 5.9273681640625, 6.2578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 10.0, 4.0, 10.0, 18.0, 27.0, 38.0, 63.0, 114.0, 211.0, 444.0, 1582.0, 9004.0, 8345523.0, 27309.0, 2810.0, 760.0, 259.0, 137.0, 78.0, 44.0, 53.0, 18.0, 20.0, 9.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 2.0, 6.0, 2.0, 1.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.94425201416016, -85.2537841796875, -82.56331634521484, -79.87284851074219, -77.18238067626953, -74.49191284179688, -71.80144500732422, -69.11097717285156, -66.4205093383789, -63.73004150390625, -61.039573669433594, -58.34910583496094, -55.65863800048828, -52.968170166015625, -50.27770233154297, -47.58723449707031, -44.896766662597656, -42.206298828125, -39.515830993652344, -36.82536315917969, -34.13489532470703, -31.444427490234375, -28.75395965576172, -26.063491821289062, -23.373023986816406, -20.68255615234375, -17.992088317871094, -15.301620483398438, -12.611152648925781, -9.920684814453125, -7.230216979980469, -4.5397491455078125, -1.849273681640625, 0.8411941528320312, 3.5316619873046875, 6.222129821777344, 8.91259765625, 11.603065490722656, 14.293533325195312, 16.98400115966797, 19.674468994140625, 22.36493682861328, 25.055404663085938, 27.745872497558594, 30.43634033203125, 33.126808166503906, 35.81727600097656, 38.50774383544922, 41.198211669921875, 43.88867950439453, 46.57914733886719, 49.269615173339844, 51.9600830078125, 54.650550842285156, 57.34101867675781, 60.03148651123047, 62.721954345703125, 65.41242218017578, 68.10289001464844, 70.7933578491211, 73.48382568359375, 76.1742935180664, 78.86476135253906, 81.55522918701172, 84.24569702148438]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 7.0, 5.0, 9.0, 5.0, 3.0, 5.0, 6.0, 4.0, 3.0, 5.0, 2.0, 5.0, 3.0, 7.0, 2.0, 0.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.10792541503906, -154.2130584716797, -149.31817626953125, -144.42330932617188, -139.5284423828125, -134.63357543945312, -129.7386932373047, -124.84382629394531, -119.9489517211914, -115.0540771484375, -110.15921020507812, -105.26433563232422, -100.36946105957031, -95.47459411621094, -90.57971954345703, -85.68484497070312, -80.78997802734375, -75.89510345458984, -71.00023651123047, -66.10536193847656, -61.21049118041992, -56.31562042236328, -51.420745849609375, -46.525875091552734, -41.631004333496094, -36.73613357543945, -31.84126091003418, -26.946388244628906, -22.051517486572266, -17.156646728515625, -12.261774063110352, -7.366901397705078, -2.4720458984375, 2.422825813293457, 7.317697525024414, 12.212569236755371, 17.107440948486328, 22.00231170654297, 26.897184371948242, 31.792057037353516, 36.686927795410156, 41.5817985534668, 46.47666931152344, 51.371543884277344, 56.266414642333984, 61.161285400390625, 66.05615997314453, 70.95103454589844, 75.84590148925781, 80.74077606201172, 85.6356430053711, 90.530517578125, 95.42538452148438, 100.32025909423828, 105.21513366699219, 110.11000061035156, 115.00487518310547, 119.89974975585938, 124.79461669921875, 129.68948364257812, 134.58436584472656, 139.47923278808594, 144.3740997314453, 149.26898193359375, 154.16384887695312]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 13.0, 21.0, 28.0, 36.0, 78.0, 73.0, 176.0, 270.0, 476.0, 902.0, 1887.0, 4420.0, 12349.0, 37975.0, 125270.0, 212674.0, 85924.0, 26423.0, 8819.0, 3320.0, 1504.0, 699.0, 372.0, 201.0, 134.0, 67.0, 50.0, 29.0, 23.0, 17.0, 5.0, 9.0, 1.0, 0.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-62.90625, -61.1259765625, -59.345703125, -57.5654296875, -55.78515625, -54.0048828125, -52.224609375, -50.4443359375, -48.6640625, -46.8837890625, -45.103515625, -43.3232421875, -41.54296875, -39.7626953125, -37.982421875, -36.2021484375, -34.421875, -32.6416015625, -30.861328125, -29.0810546875, -27.30078125, -25.5205078125, -23.740234375, -21.9599609375, -20.1796875, -18.3994140625, -16.619140625, -14.8388671875, -13.05859375, -11.2783203125, -9.498046875, -7.7177734375, -5.9375, -4.1572265625, -2.376953125, -0.5966796875, 1.18359375, 2.9638671875, 4.744140625, 6.5244140625, 8.3046875, 10.0849609375, 11.865234375, 13.6455078125, 15.42578125, 17.2060546875, 18.986328125, 20.7666015625, 22.546875, 24.3271484375, 26.107421875, 27.8876953125, 29.66796875, 31.4482421875, 33.228515625, 35.0087890625, 36.7890625, 38.5693359375, 40.349609375, 42.1298828125, 43.91015625, 45.6904296875, 47.470703125, 49.2509765625, 51.03125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 15.0, 20.0, 29.0, 45.0, 59.0, 80.0, 100.0, 127.0, 133.0, 81.0, 78.0, 63.0, 45.0, 37.0, 20.0, 24.0, 11.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.611328125, -10.24609375, -9.880859375, -9.515625, -9.150390625, -8.78515625, -8.419921875, -8.0546875, -7.689453125, -7.32421875, -6.958984375, -6.59375, -6.228515625, -5.86328125, -5.498046875, -5.1328125, -4.767578125, -4.40234375, -4.037109375, -3.671875, -3.306640625, -2.94140625, -2.576171875, -2.2109375, -1.845703125, -1.48046875, -1.115234375, -0.75, -0.384765625, -0.01953125, 0.345703125, 0.7109375, 1.076171875, 1.44140625, 1.806640625, 2.171875, 2.537109375, 2.90234375, 3.267578125, 3.6328125, 3.998046875, 4.36328125, 4.728515625, 5.09375, 5.458984375, 5.82421875, 6.189453125, 6.5546875, 6.919921875, 7.28515625, 7.650390625, 8.015625, 8.380859375, 8.74609375, 9.111328125, 9.4765625, 9.841796875, 10.20703125, 10.572265625, 10.9375, 11.302734375, 11.66796875, 12.033203125, 12.3984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 4.0, 1.0, 6.0, 7.0, 4.0, 15.0, 25.0, 14.0, 31.0, 65.0, 58.0, 75.0, 59.0, 34.0, 27.0, 18.0, 3.0, 8.0, 4.0, 4.0, 2.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.72188949584961, -53.93724060058594, -52.152591705322266, -50.367942810058594, -48.58329391479492, -46.79864501953125, -45.01399230957031, -43.229347229003906, -41.44469451904297, -39.6600456237793, -37.875396728515625, -36.09074783325195, -34.30609893798828, -32.52145004272461, -30.736799240112305, -28.952150344848633, -27.167503356933594, -25.382854461669922, -23.59820556640625, -21.813556671142578, -20.028907775878906, -18.244258880615234, -16.45960807800293, -14.674959182739258, -12.890310287475586, -11.105661392211914, -9.321012496948242, -7.536362648010254, -5.751713752746582, -3.96706485748291, -2.182415008544922, -0.39776611328125, 1.3868827819824219, 3.171531915664673, 4.956181049346924, 6.740830421447754, 8.525479316711426, 10.310128211975098, 12.094778060913086, 13.879426956176758, 15.66407585144043, 17.4487247467041, 19.233373641967773, 21.018024444580078, 22.80267333984375, 24.587322235107422, 26.371971130371094, 28.156620025634766, 29.941268920898438, 31.72591781616211, 33.51056671142578, 35.29521560668945, 37.079864501953125, 38.8645133972168, 40.64916229248047, 42.433815002441406, 44.21846008300781, 46.003108978271484, 47.787757873535156, 49.57240676879883, 51.3570556640625, 53.14170455932617, 54.926353454589844, 56.71100616455078, 58.49565505981445]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 4.0, 8.0, 16.0, 9.0, 19.0, 37.0, 55.0, 71.0, 70.0, 65.0, 43.0, 17.0, 15.0, 9.0, 5.0, 7.0, 6.0, 2.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.547569274902344, -40.342533111572266, -39.13750076293945, -37.932464599609375, -36.72743225097656, -35.522396087646484, -34.317359924316406, -33.112327575683594, -31.907291412353516, -30.70225715637207, -29.497222900390625, -28.292186737060547, -27.0871524810791, -25.882118225097656, -24.677082061767578, -23.472047805786133, -22.267013549804688, -21.061979293823242, -19.856945037841797, -18.65190887451172, -17.446874618530273, -16.241840362548828, -15.036805152893066, -13.831769943237305, -12.62673568725586, -11.421701431274414, -10.216666221618652, -9.01163101196289, -7.806596755981445, -6.601562023162842, -5.396527290344238, -4.191492080688477, -2.9864578247070312, -1.7814230918884277, -0.5763883590698242, 0.6286463737487793, 1.8336811065673828, 3.0387158393859863, 4.24375057220459, 5.448785781860352, 6.653820037841797, 7.8588547706604, 9.063889503479004, 10.268924713134766, 11.473958969116211, 12.678993225097656, 13.884028434753418, 15.08906364440918, 16.294097900390625, 17.49913215637207, 18.704166412353516, 19.909202575683594, 21.11423683166504, 22.319271087646484, 23.524307250976562, 24.729341506958008, 25.934375762939453, 27.1394100189209, 28.344444274902344, 29.549480438232422, 30.754514694213867, 31.959548950195312, 33.16458511352539, 34.36962127685547, 35.57465362548828]}, "eval/loss": 1.8364678621292114, "eval/wer": 0.2812376041253471, "eval/runtime": 832.195, "eval/samples_per_second": 3.175, "eval/steps_per_second": 0.398, "train/train_runtime": 108037.8512, "train/train_samples_per_second": 5.283, "train/train_steps_per_second": 0.165, "train/total_flos": 0.0, "train/train_loss": 2.302149100206905} \ No newline at end of file