diff --git a/model_card/layer_images/layer_0_attention_output_dense.png b/model_card/layer_images/layer_0_attention_output_dense.png index 272010bff3998ff98d9094116b9f4b6cd8a44854..893952b868791bf372c799456283ba80ccae9a08 100644 Binary files a/model_card/layer_images/layer_0_attention_output_dense.png and b/model_card/layer_images/layer_0_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_0_attention_self_key.png b/model_card/layer_images/layer_0_attention_self_key.png index b475f1b28d4ffd4bfc0a75ffbb711651784a08b9..c46104906096553e053e287b9dcf68fd7cfc58ab 100644 Binary files a/model_card/layer_images/layer_0_attention_self_key.png and b/model_card/layer_images/layer_0_attention_self_key.png differ diff --git a/model_card/layer_images/layer_0_attention_self_query.png b/model_card/layer_images/layer_0_attention_self_query.png index 1223393bce9b9fc8ce7c9273cee7cf4de4a38f0d..797f2f89e011df4c57a34e7275ed52a259d4288c 100644 Binary files a/model_card/layer_images/layer_0_attention_self_query.png and b/model_card/layer_images/layer_0_attention_self_query.png differ diff --git a/model_card/layer_images/layer_0_attention_self_value.png b/model_card/layer_images/layer_0_attention_self_value.png index 6313ac0382780df8cf9e6b93d4560ed6014ca1be..309d10eed8412216855e5257e91bfa89886b90f5 100644 Binary files a/model_card/layer_images/layer_0_attention_self_value.png and b/model_card/layer_images/layer_0_attention_self_value.png differ diff --git a/model_card/layer_images/layer_0_intermediate_dense.png b/model_card/layer_images/layer_0_intermediate_dense.png index 1f9829ba6f4982d3e3a9113357d4d03376e09e76..04ea38b48e10966e66e30916f2d7038cb708a99f 100644 Binary files a/model_card/layer_images/layer_0_intermediate_dense.png and b/model_card/layer_images/layer_0_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_0_output_dense.png b/model_card/layer_images/layer_0_output_dense.png index 9ba82c38dc1f1e9ff040d8848bb20503f4e3e1bc..89e34cb8ea07d52ba5b3cbc7e4ad64e76cc3b6a4 100644 Binary files a/model_card/layer_images/layer_0_output_dense.png and b/model_card/layer_images/layer_0_output_dense.png differ diff --git a/model_card/layer_images/layer_10_attention_output_dense.png b/model_card/layer_images/layer_10_attention_output_dense.png index 65a8f0f5e31786e4a49186832f80da02ac5da9f6..6cf668d4298af3558a79e592818f385c5ed0b82e 100644 Binary files a/model_card/layer_images/layer_10_attention_output_dense.png and b/model_card/layer_images/layer_10_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_10_attention_self_key.png b/model_card/layer_images/layer_10_attention_self_key.png index fe7a46e8e28532a66f5d89178acce7bb680acd5b..72c1f7351a4d624840fbb990f462ef836a6059c7 100644 Binary files a/model_card/layer_images/layer_10_attention_self_key.png and b/model_card/layer_images/layer_10_attention_self_key.png differ diff --git a/model_card/layer_images/layer_10_attention_self_query.png b/model_card/layer_images/layer_10_attention_self_query.png index ac7f5b74385941878b74b4d2e4cbb858adeadbda..d12b599647f1aab57d863b9bdd9be3c9d6257e14 100644 Binary files a/model_card/layer_images/layer_10_attention_self_query.png and b/model_card/layer_images/layer_10_attention_self_query.png differ diff --git a/model_card/layer_images/layer_10_attention_self_value.png b/model_card/layer_images/layer_10_attention_self_value.png index 7a151c6abae73339a7aed088d42b992b275f52b2..0e40dbc566fa87e1cd11a0c66d3bc8de29ca39e9 100644 Binary files a/model_card/layer_images/layer_10_attention_self_value.png and b/model_card/layer_images/layer_10_attention_self_value.png differ diff --git a/model_card/layer_images/layer_10_intermediate_dense.png b/model_card/layer_images/layer_10_intermediate_dense.png index 790423093355d6c6556c7dadf32bafda7f0abcac..56e778c898350bff306c3b046fe8abf21710e4a3 100644 Binary files a/model_card/layer_images/layer_10_intermediate_dense.png and b/model_card/layer_images/layer_10_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_10_output_dense.png b/model_card/layer_images/layer_10_output_dense.png index 3fc8da74cfc240a5a33547a59cdf36602eaac2f5..e040d01bcd7eebaca3d3df77b8d29547c8b220b4 100644 Binary files a/model_card/layer_images/layer_10_output_dense.png and b/model_card/layer_images/layer_10_output_dense.png differ diff --git a/model_card/layer_images/layer_11_attention_output_dense.png b/model_card/layer_images/layer_11_attention_output_dense.png index 7c1ffd47f14950bfe9afac21b5f655f07c3857e3..aada9ba230a42106a6acd87d7bf378ed00006f0c 100644 Binary files a/model_card/layer_images/layer_11_attention_output_dense.png and b/model_card/layer_images/layer_11_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_11_attention_self_key.png b/model_card/layer_images/layer_11_attention_self_key.png index b74e59a3a6f4b24eeda57920bc263d79bb1c4e65..2a66df922a55db74b968c950e6214be37689316a 100644 Binary files a/model_card/layer_images/layer_11_attention_self_key.png and b/model_card/layer_images/layer_11_attention_self_key.png differ diff --git a/model_card/layer_images/layer_11_attention_self_query.png b/model_card/layer_images/layer_11_attention_self_query.png index b9ca1fcfeb21b0c6bd67140d1a6742abdd400718..b3545ef97f2e391aa77e8856bec94111976bfa7d 100644 Binary files a/model_card/layer_images/layer_11_attention_self_query.png and b/model_card/layer_images/layer_11_attention_self_query.png differ diff --git a/model_card/layer_images/layer_11_attention_self_value.png b/model_card/layer_images/layer_11_attention_self_value.png index 2f2f6a2a7ac60db90d2b630e3bcf06ee37ae9ed6..2d6f7f3a1b6ba69f7ec94fd0941f3f11130ebb6a 100644 Binary files a/model_card/layer_images/layer_11_attention_self_value.png and b/model_card/layer_images/layer_11_attention_self_value.png differ diff --git a/model_card/layer_images/layer_11_intermediate_dense.png b/model_card/layer_images/layer_11_intermediate_dense.png index f03084b9fcf7ca89aec12ae344f1022a76cb963e..711926c63f064db97e795f3742697b2878a720af 100644 Binary files a/model_card/layer_images/layer_11_intermediate_dense.png and b/model_card/layer_images/layer_11_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_11_output_dense.png b/model_card/layer_images/layer_11_output_dense.png index 346ed41b05918fd10047eef3aae1cee2d6a9f8fe..eb698e5338838c8c3b9312a3b8d5c1c5126fee51 100644 Binary files a/model_card/layer_images/layer_11_output_dense.png and b/model_card/layer_images/layer_11_output_dense.png differ diff --git a/model_card/layer_images/layer_1_attention_output_dense.png b/model_card/layer_images/layer_1_attention_output_dense.png index d1ec42dd0aa27c1688846a644d8d4eca033e8981..3f008d1b9488af65e1336915caf217ff26e0e897 100644 Binary files a/model_card/layer_images/layer_1_attention_output_dense.png and b/model_card/layer_images/layer_1_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_1_attention_self_key.png b/model_card/layer_images/layer_1_attention_self_key.png index 2c758996da1c9d39f9c7c727dfc37118e5cafecf..8dede4a20330ee2bef2a22f7462136199b4fe2a5 100644 Binary files a/model_card/layer_images/layer_1_attention_self_key.png and b/model_card/layer_images/layer_1_attention_self_key.png differ diff --git a/model_card/layer_images/layer_1_attention_self_query.png b/model_card/layer_images/layer_1_attention_self_query.png index 7f0efe65c6b657c6f3d3829193bbd10e726baf76..66bfbc059d0cb9f09a32e78f2412dfec48c311f5 100644 Binary files a/model_card/layer_images/layer_1_attention_self_query.png and b/model_card/layer_images/layer_1_attention_self_query.png differ diff --git a/model_card/layer_images/layer_1_attention_self_value.png b/model_card/layer_images/layer_1_attention_self_value.png index 498946fc8f40a60f8bfac9c6462a4dbf40e82407..8262e5030efe5badbc7368af4311efadd7ef52f2 100644 Binary files a/model_card/layer_images/layer_1_attention_self_value.png and b/model_card/layer_images/layer_1_attention_self_value.png differ diff --git a/model_card/layer_images/layer_1_intermediate_dense.png b/model_card/layer_images/layer_1_intermediate_dense.png index e983f202011a98edf4e2106e05a81115f3decfe3..7d393a9d08fc7b148b4afa67176569996557a67f 100644 Binary files a/model_card/layer_images/layer_1_intermediate_dense.png and b/model_card/layer_images/layer_1_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_1_output_dense.png b/model_card/layer_images/layer_1_output_dense.png index babaea59ad2ea17fbd220630618c2430a8304f1f..b75d2c1e24f85cb80e1e86d41074c8f9f2666053 100644 Binary files a/model_card/layer_images/layer_1_output_dense.png and b/model_card/layer_images/layer_1_output_dense.png differ diff --git a/model_card/layer_images/layer_2_attention_output_dense.png b/model_card/layer_images/layer_2_attention_output_dense.png index fd99d7f7aac82a2db5628fcf51c23d44d74f758d..4d275d25c0ef840bd16502d4948c76126af24c0d 100644 Binary files a/model_card/layer_images/layer_2_attention_output_dense.png and b/model_card/layer_images/layer_2_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_2_attention_self_key.png b/model_card/layer_images/layer_2_attention_self_key.png index 8602939902157e379f3fa01931b5e11383bf8654..d29fa554394c8d06b5777e0623dc8fce752b6165 100644 Binary files a/model_card/layer_images/layer_2_attention_self_key.png and b/model_card/layer_images/layer_2_attention_self_key.png differ diff --git a/model_card/layer_images/layer_2_attention_self_query.png b/model_card/layer_images/layer_2_attention_self_query.png index 57241cb9a44c6b6f47a556ea4be7e574fe5e8d78..0bd1836388a1d42183ba44638fed1152024e204a 100644 Binary files a/model_card/layer_images/layer_2_attention_self_query.png and b/model_card/layer_images/layer_2_attention_self_query.png differ diff --git a/model_card/layer_images/layer_2_attention_self_value.png b/model_card/layer_images/layer_2_attention_self_value.png index 7e8c3bf9c99d527e674bb456d1f12a8cbdbe9da3..cb8f3d5857eae6b39ef47f2c1d80b9ff7932150e 100644 Binary files a/model_card/layer_images/layer_2_attention_self_value.png and b/model_card/layer_images/layer_2_attention_self_value.png differ diff --git a/model_card/layer_images/layer_2_intermediate_dense.png b/model_card/layer_images/layer_2_intermediate_dense.png index 52330e6e65eebf2c84ed7e7d7b6b92e66eff1dab..7f06e55ab2ba69a162edf9b5ef3bb6635156879c 100644 Binary files a/model_card/layer_images/layer_2_intermediate_dense.png and b/model_card/layer_images/layer_2_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_2_output_dense.png b/model_card/layer_images/layer_2_output_dense.png index 5e5a9b865607cb590d9272e8e27067e9a53a7fe2..17383c1c4278a1b0739daf23c2db99dc7bfb0919 100644 Binary files a/model_card/layer_images/layer_2_output_dense.png and b/model_card/layer_images/layer_2_output_dense.png differ diff --git a/model_card/layer_images/layer_3_attention_output_dense.png b/model_card/layer_images/layer_3_attention_output_dense.png index efc2eefb93d0ec8de4c5d47861c59ccdbc9d6d62..de845d7b192c25e1a1e44da636af98855461b8b8 100644 Binary files a/model_card/layer_images/layer_3_attention_output_dense.png and b/model_card/layer_images/layer_3_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_3_attention_self_key.png b/model_card/layer_images/layer_3_attention_self_key.png index 16d71f68ae1fd15dab918c77385abf746f6bf579..3e7acdb4ad560bd95235c24961b9ba80e935d359 100644 Binary files a/model_card/layer_images/layer_3_attention_self_key.png and b/model_card/layer_images/layer_3_attention_self_key.png differ diff --git a/model_card/layer_images/layer_3_attention_self_query.png b/model_card/layer_images/layer_3_attention_self_query.png index 4bffde1580b6d85ad69ee41a4e55c85b3b2cc30a..3fc15dbbab6a5d6ee7702dc57590fe4e7b4dc5ac 100644 Binary files a/model_card/layer_images/layer_3_attention_self_query.png and b/model_card/layer_images/layer_3_attention_self_query.png differ diff --git a/model_card/layer_images/layer_3_attention_self_value.png b/model_card/layer_images/layer_3_attention_self_value.png index 510f46c24eb705829318dc72ca9c4383bc280782..6882304b2c36d7beee1e082a2555ade065e74a0d 100644 Binary files a/model_card/layer_images/layer_3_attention_self_value.png and b/model_card/layer_images/layer_3_attention_self_value.png differ diff --git a/model_card/layer_images/layer_3_intermediate_dense.png b/model_card/layer_images/layer_3_intermediate_dense.png index 6e5eb63562a851e73db1d4c8d9d3485f590c5997..599dc305efe92ecfadd90f89c5e84b6b525a295e 100644 Binary files a/model_card/layer_images/layer_3_intermediate_dense.png and b/model_card/layer_images/layer_3_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_3_output_dense.png b/model_card/layer_images/layer_3_output_dense.png index 6b9b6962c1da02d67efcc7cae6aa3f9fa9706bec..f2f8f5475e5d86a3bb5ed7d605837ab40e472668 100644 Binary files a/model_card/layer_images/layer_3_output_dense.png and b/model_card/layer_images/layer_3_output_dense.png differ diff --git a/model_card/layer_images/layer_4_attention_output_dense.png b/model_card/layer_images/layer_4_attention_output_dense.png index 42fd2db9e7d1fad936de8ba8490c38243c071e1e..52ed1ac730db22de14f21aa68212b201b32178f7 100644 Binary files a/model_card/layer_images/layer_4_attention_output_dense.png and b/model_card/layer_images/layer_4_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_4_attention_self_key.png b/model_card/layer_images/layer_4_attention_self_key.png index 39872d672462feab639b54059ab663a8cfbbd300..0612a9c7d7b4734d8d069b84d41d9ad77405df4e 100644 Binary files a/model_card/layer_images/layer_4_attention_self_key.png and b/model_card/layer_images/layer_4_attention_self_key.png differ diff --git a/model_card/layer_images/layer_4_attention_self_query.png b/model_card/layer_images/layer_4_attention_self_query.png index f3596d8ff87c844e456dbbecacdb68ca50acf34a..ee8d771c1ba6622c6bc4df123084fac54599f358 100644 Binary files a/model_card/layer_images/layer_4_attention_self_query.png and b/model_card/layer_images/layer_4_attention_self_query.png differ diff --git a/model_card/layer_images/layer_4_attention_self_value.png b/model_card/layer_images/layer_4_attention_self_value.png index 399debfcb8a1091d283ecfa45f026ccdf3055b96..27e93ab4489c01ab6efcec77abeb7271eec91a3f 100644 Binary files a/model_card/layer_images/layer_4_attention_self_value.png and b/model_card/layer_images/layer_4_attention_self_value.png differ diff --git a/model_card/layer_images/layer_4_intermediate_dense.png b/model_card/layer_images/layer_4_intermediate_dense.png index 379763ae4aee80cedd2ae1e2c0b6fdb318d5f6ae..51e01ce19d21f59ea2abeed9fd3020fd9517ad12 100644 Binary files a/model_card/layer_images/layer_4_intermediate_dense.png and b/model_card/layer_images/layer_4_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_4_output_dense.png b/model_card/layer_images/layer_4_output_dense.png index 3498de55da2a21ce5038290bfccecd98d26fcecf..989e1252452dcd0312030d57031f56d42e9e7391 100644 Binary files a/model_card/layer_images/layer_4_output_dense.png and b/model_card/layer_images/layer_4_output_dense.png differ diff --git a/model_card/layer_images/layer_5_attention_output_dense.png b/model_card/layer_images/layer_5_attention_output_dense.png index ae1ae2124f8c30c5f024029b89997f225b5f6df1..74c01fd487f78006d260bb05cd624695fa612156 100644 Binary files a/model_card/layer_images/layer_5_attention_output_dense.png and b/model_card/layer_images/layer_5_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_5_attention_self_key.png b/model_card/layer_images/layer_5_attention_self_key.png index e7665bf07366dfa9fd6ef9e6b73dd0c0e8cb84b1..a0e6007bd32e7c156ca7841853d1a68b527a323c 100644 Binary files a/model_card/layer_images/layer_5_attention_self_key.png and b/model_card/layer_images/layer_5_attention_self_key.png differ diff --git a/model_card/layer_images/layer_5_attention_self_query.png b/model_card/layer_images/layer_5_attention_self_query.png index b20fb05c9452954fe97a3109d7102fd7ffccbad0..50931742024dac0f69c00ef0c8dc71725f000697 100644 Binary files a/model_card/layer_images/layer_5_attention_self_query.png and b/model_card/layer_images/layer_5_attention_self_query.png differ diff --git a/model_card/layer_images/layer_5_attention_self_value.png b/model_card/layer_images/layer_5_attention_self_value.png index ef5e4c8316996884f9cf746aafa128d28dec0ff4..ae9ae649b04c46280e96c1321d87d2d9a1832daa 100644 Binary files a/model_card/layer_images/layer_5_attention_self_value.png and b/model_card/layer_images/layer_5_attention_self_value.png differ diff --git a/model_card/layer_images/layer_5_intermediate_dense.png b/model_card/layer_images/layer_5_intermediate_dense.png index 70fcdb38cda3147805f93d3dd104f9ef15839951..5728d0d7ddfad5dbea8df9e44ea313a072a8b964 100644 Binary files a/model_card/layer_images/layer_5_intermediate_dense.png and b/model_card/layer_images/layer_5_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_5_output_dense.png b/model_card/layer_images/layer_5_output_dense.png index 49cccb63afa119f32d571c84ee345d1e220aae58..ec14107a5967e90abf3bc85e49a42fd8a3d1781b 100644 Binary files a/model_card/layer_images/layer_5_output_dense.png and b/model_card/layer_images/layer_5_output_dense.png differ diff --git a/model_card/layer_images/layer_6_attention_output_dense.png b/model_card/layer_images/layer_6_attention_output_dense.png index a855dd9469b86cfd46fa9ff812c2676fab61fa47..fc888fbd1fe9c32eccc55e36158f8804e575ac5d 100644 Binary files a/model_card/layer_images/layer_6_attention_output_dense.png and b/model_card/layer_images/layer_6_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_6_attention_self_key.png b/model_card/layer_images/layer_6_attention_self_key.png index 704e2328ce8295fb2956cf8ddb9bcd36fa86ca59..037f13819a8501ac0b30efe1566b62f0dee73145 100644 Binary files a/model_card/layer_images/layer_6_attention_self_key.png and b/model_card/layer_images/layer_6_attention_self_key.png differ diff --git a/model_card/layer_images/layer_6_attention_self_query.png b/model_card/layer_images/layer_6_attention_self_query.png index ab29025cb4df29c15f8871c68c18288fb88257cc..3968a2b40594b5e2e17ac471ac4971d64f98f32a 100644 Binary files a/model_card/layer_images/layer_6_attention_self_query.png and b/model_card/layer_images/layer_6_attention_self_query.png differ diff --git a/model_card/layer_images/layer_6_attention_self_value.png b/model_card/layer_images/layer_6_attention_self_value.png index ac9b1e2f7c6a4a82581e780d124cb3660af1ee09..0f36218d29961c7a447dffe1f4d912a0ba64a15a 100644 Binary files a/model_card/layer_images/layer_6_attention_self_value.png and b/model_card/layer_images/layer_6_attention_self_value.png differ diff --git a/model_card/layer_images/layer_6_intermediate_dense.png b/model_card/layer_images/layer_6_intermediate_dense.png index 66b85c91cf182eb5a9ff281d8725bfcf27743fbc..8b9d05c11dd0d35d1d343e25eae3729fa83d242e 100644 Binary files a/model_card/layer_images/layer_6_intermediate_dense.png and b/model_card/layer_images/layer_6_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_6_output_dense.png b/model_card/layer_images/layer_6_output_dense.png index c0e25f0bbbcc0bb87dbb1f6e96831a6c9d493cab..f9ef22695641e6392087b7a9d36ee84d021ebd41 100644 Binary files a/model_card/layer_images/layer_6_output_dense.png and b/model_card/layer_images/layer_6_output_dense.png differ diff --git a/model_card/layer_images/layer_7_attention_output_dense.png b/model_card/layer_images/layer_7_attention_output_dense.png index db44257472277173451a9b2ff007b2889540a480..362672b4e7a79cbfa19721887b6c0ade2c0235ff 100644 Binary files a/model_card/layer_images/layer_7_attention_output_dense.png and b/model_card/layer_images/layer_7_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_7_attention_self_key.png b/model_card/layer_images/layer_7_attention_self_key.png index 69876ffb9f70a12999ef570900d99eaa689c7ef9..a90ee63e0d88a9f6d801d1e2c38dd8f4d3f6cf14 100644 Binary files a/model_card/layer_images/layer_7_attention_self_key.png and b/model_card/layer_images/layer_7_attention_self_key.png differ diff --git a/model_card/layer_images/layer_7_attention_self_query.png b/model_card/layer_images/layer_7_attention_self_query.png index aebb11f380eacb31b85c05a48fb2a37fe9d0cedf..bd5cdf127158619451c9d60a58da192a460d5bb4 100644 Binary files a/model_card/layer_images/layer_7_attention_self_query.png and b/model_card/layer_images/layer_7_attention_self_query.png differ diff --git a/model_card/layer_images/layer_7_attention_self_value.png b/model_card/layer_images/layer_7_attention_self_value.png index ad03476d0b6dba975743591fb5f5b8fb04fa63a1..3fab7c062a4adbd9dcfd922aeab0ea1aab43073c 100644 Binary files a/model_card/layer_images/layer_7_attention_self_value.png and b/model_card/layer_images/layer_7_attention_self_value.png differ diff --git a/model_card/layer_images/layer_7_intermediate_dense.png b/model_card/layer_images/layer_7_intermediate_dense.png index d254d87daaa463732b324efe068eb264c3a60d7d..bf46527531955ba5c7163c0b3fa74356f9b0b5e2 100644 Binary files a/model_card/layer_images/layer_7_intermediate_dense.png and b/model_card/layer_images/layer_7_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_7_output_dense.png b/model_card/layer_images/layer_7_output_dense.png index 079706fea779863218e89e0785a8f8a924f9c5aa..d526b2d482c9b63218d5c7bdde93b4556ac73b18 100644 Binary files a/model_card/layer_images/layer_7_output_dense.png and b/model_card/layer_images/layer_7_output_dense.png differ diff --git a/model_card/layer_images/layer_8_attention_output_dense.png b/model_card/layer_images/layer_8_attention_output_dense.png index 78b99f27f1b4229d8d16c23a0e13dd78fcdf5756..a41c597503b5ecf7c5c24772144e6b441cc1471e 100644 Binary files a/model_card/layer_images/layer_8_attention_output_dense.png and b/model_card/layer_images/layer_8_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_8_attention_self_key.png b/model_card/layer_images/layer_8_attention_self_key.png index 813d203d7096125fa60340949f6dfd5b7afee964..14142d71bffd208d055ca38270d3d536053f9f22 100644 Binary files a/model_card/layer_images/layer_8_attention_self_key.png and b/model_card/layer_images/layer_8_attention_self_key.png differ diff --git a/model_card/layer_images/layer_8_attention_self_query.png b/model_card/layer_images/layer_8_attention_self_query.png index 3905bdd2aaab79759b57dd72125f76bd2c238aab..9f8dd6cd1fc78b3a75159211dabea5f00e7d9dd1 100644 Binary files a/model_card/layer_images/layer_8_attention_self_query.png and b/model_card/layer_images/layer_8_attention_self_query.png differ diff --git a/model_card/layer_images/layer_8_attention_self_value.png b/model_card/layer_images/layer_8_attention_self_value.png index fe666aa6c81ef17fb29fd5d52a5f5f575f648798..27f7b1a46bedfd5146441b421347a04b97938293 100644 Binary files a/model_card/layer_images/layer_8_attention_self_value.png and b/model_card/layer_images/layer_8_attention_self_value.png differ diff --git a/model_card/layer_images/layer_8_intermediate_dense.png b/model_card/layer_images/layer_8_intermediate_dense.png index e54ae4fb0b19b869ae10c04cb324ea3aecea53a3..4e70a378228e0a62ab4ebdf2bf8d1b2624b8f2c4 100644 Binary files a/model_card/layer_images/layer_8_intermediate_dense.png and b/model_card/layer_images/layer_8_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_8_output_dense.png b/model_card/layer_images/layer_8_output_dense.png index 4298f28dfd9679419da147735f6f3d0a30baefec..0987099f53505091fc99cd56f9548970c10ac7c7 100644 Binary files a/model_card/layer_images/layer_8_output_dense.png and b/model_card/layer_images/layer_8_output_dense.png differ diff --git a/model_card/layer_images/layer_9_attention_output_dense.png b/model_card/layer_images/layer_9_attention_output_dense.png index 22566df993d16ee4b2c9ea82a988981c753e31a5..0c6da97b3efad4bda17200212d740b97c8676fad 100644 Binary files a/model_card/layer_images/layer_9_attention_output_dense.png and b/model_card/layer_images/layer_9_attention_output_dense.png differ diff --git a/model_card/layer_images/layer_9_attention_self_key.png b/model_card/layer_images/layer_9_attention_self_key.png index b9c3bcf0225a0f66a8109ada6fc7d29c98b8ba1d..5b02898f76abe3f42403c3824fe70b5a39d9d907 100644 Binary files a/model_card/layer_images/layer_9_attention_self_key.png and b/model_card/layer_images/layer_9_attention_self_key.png differ diff --git a/model_card/layer_images/layer_9_attention_self_query.png b/model_card/layer_images/layer_9_attention_self_query.png index 1aa7dcb5fba016ff668fd38f7f6717ff44fe6437..ec1b73d1ac13ecc05af28513d0d0f26269e73cea 100644 Binary files a/model_card/layer_images/layer_9_attention_self_query.png and b/model_card/layer_images/layer_9_attention_self_query.png differ diff --git a/model_card/layer_images/layer_9_attention_self_value.png b/model_card/layer_images/layer_9_attention_self_value.png index 681f346f1c63530b0db231ffa439f542bd3234cb..1b6503cc96cad531beaef14c92117e2e8d654ec7 100644 Binary files a/model_card/layer_images/layer_9_attention_self_value.png and b/model_card/layer_images/layer_9_attention_self_value.png differ diff --git a/model_card/layer_images/layer_9_intermediate_dense.png b/model_card/layer_images/layer_9_intermediate_dense.png index 6dc244f198cb203d0b95dd063fd6539cf8b30802..81116a34135961b61b555da47e6f44787cc32492 100644 Binary files a/model_card/layer_images/layer_9_intermediate_dense.png and b/model_card/layer_images/layer_9_intermediate_dense.png differ diff --git a/model_card/layer_images/layer_9_output_dense.png b/model_card/layer_images/layer_9_output_dense.png index c19335b55c4b4ef135d297a086a14f94dfba74f1..bfe1491c9fcebec3d3e5d1ed9024ea889cc6d361 100644 Binary files a/model_card/layer_images/layer_9_output_dense.png and b/model_card/layer_images/layer_9_output_dense.png differ diff --git a/model_card/pruning.svg b/model_card/pruning.svg index 58b4e6e00839228754e356e3df4ba0f9df124eb0..0e68dc5ce5c30a78fd7bc5ea4f9cf8de7671e3bc 100644 --- a/model_card/pruning.svg +++ b/model_card/pruning.svg @@ -1 +1 @@ -43464457455389868875877901234567891011024681012prunedactivePruned Transformer HeadsLayer indexHeads count \ No newline at end of file +43464457455389868875877901234567891011024681012prunedactivePruned Transformer HeadsLayer indexHeads count \ No newline at end of file