move to v3.4.9-beta

Files changed:

- README.md +6 -1
- demo/cote_replacements.json +3 -2
- demo/genders.json +140 -0
- demo/translation_settings.json +9 -7
- handlers/json_handler.py +12 -18
- jsons/cote_replacements.json +3 -3
- lib/common/translation_settings_description.txt +4 -0
- lib/gui/HUGGING_FACE_README.md +5 -0
- lib/gui/save_to_file.js +2 -1
- modules/common/file_ensurer.py +25 -1
- modules/common/gender_util.py +420 -0
- modules/common/toolkit.py +1 -1
- modules/common/translator.py +34 -40
- modules/gui/gui_json_util.py +2 -1
- requirements.txt +2 -2
- util/token_counter.py +1 -1
- webgui.py +172 -74
README.md
CHANGED
@@ -113,6 +113,11 @@ For further details on the settings file, see [here](#translation-with-llms-settings)
 batch_retry_timeout : How long Kudasai will try to translate a batch, in seconds. If a request exceeds this duration, Kudasai will leave it untranslated.
 
 number_of_concurrent_batches : How many translation batches Kudasai will send to the translation API at a time. For OpenAI, be conservative as rate-limiting is aggressive; I'd suggest 3-5. For Gemini, do not exceed 15 for 1.0 or 2 for 1.5. This setting more or less doesn't matter for DeepL.
+
+gender_context_insertion : true or false - Whether to insert gender info into system prompts when translating text. Kudasai will look for a "genders.json" (exactly) in the root directory and scan each text to translate for the names in that file. If a name is found, Kudasai will insert the gender info into the system prompt. For more info, see the README.md.
+
+is_cote : true or false - Whether you are translating COTE (Classroom of the Elite). Kudasai has specialized functions for COTE that will be enabled if this is set to true.
+
 ----------------------------------------------------------------------------------
 Open AI Settings:
 See https://platform.openai.com/docs/api-reference/chat/create for further details
@@ -223,4 +228,4 @@ I actively encourage and welcome any feedback on this project.
 
 Kudasai gets its original name idea from its inspiration, Atreyagaurav's Onegai, which also means "please". You can find that [here](https://github.com/Atreyagaurav/onegai)
 
----------------------------------------------------------------------------------------------------------------------------------------------------
+---------------------------------------------------------------------------------------------------------------------------------------------------
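When gender_context_insertion is enabled, the assembled gender list is appended to the LLM system message. A minimal sketch of the resulting prompt shape (the names and base message below are made up; the real assembly lives in modules/common/translator.py):

```python
## Illustrative only: mirrors the "Additional Information" block Kudasai appends
## to the system message when gender_context_insertion is true.
assumptions = ["Horikita : Female\n", "Ayanokōji : Male\n"]

assumption_string = "Additional Information:\nCharacter Genders:\n" + "".join(assumptions)
system_message = "As a Japanese to English translator, translate narration into simple past tense." + "\n" + assumption_string

print(system_message)
```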
demo/cote_replacements.json
CHANGED
@@ -87,7 +87,7 @@
 "Mika": ["美香"],
 "Minamikawa": ["南川"],
 "Namekawa": ["滑川"],
-"…
+"Ōba": ["大場"],
 "Obokata": ["小保方"],
 "Onizuka": ["鬼塚"],
 "Ryūko": ["竜子"],
@@ -209,7 +209,8 @@
 },
 
 "enhanced_check_whitelist": {
-"Hoshinomiya Chie": ["星之宮","知恵"]
+"Hoshinomiya Chie": ["星之宮","知恵"],
+"Kijima": ["鬼島"]
 }
 
 }
demo/genders.json
ADDED
@@ -0,0 +1,140 @@
{
    "Male": {
        "Ijūin": ["伊集院"],
        "Iki": ["井木"],
        "Ishida": ["石田"],
        "Keisei": ["啓誠"],
        "Kijima": ["鬼島"],
        "Kisarazu": ["木更津"],
        "Kinugasa": ["衣笠"],
        "Ohba": ["大場"],
        "Onizuka": ["鬼塚"],
        "Satonaka": ["里中"],
        "Shiro": ["志朗"],
        "Sonezaki": ["曽根崎"],
        "Sōya": ["宗谷"],
        "Sugio": ["杉尾"],
        "Tatebayashi": ["舘林"],
        "Tomose": ["トモセ"],
        "Toyohashi": ["豊橋"],
        "Asama Hisashi": ["浅間", "久"],
        "Ayanokōji Atsuomi": ["綾小路", "篤臣"],
        "Ayanokōji Kiyotaka": ["綾小路", "清隆"],
        "Hamaguchi Tetsuya": ["浜口", "哲也"],
        "Hashimoto Masayoshi": ["橋本", "正義"],
        "Hirata Yōsuke": ["平田", "洋介"],
        "Hondō Ryōtarō": ["本堂", "遼太郎"],
        "Hōsen Kazuomi": ["宝泉", "和臣"],
        "Ike Kanji": ["池", "寛治"],
        "Ishigami Kyō": ["石上", "京"],
        "Ishizaki Daichi": ["石崎", "大地"],
        "Isomaru Yōkō": ["磯丸", "容幸"],
        "Kamogawa Toshizō": ["鴨川", "俊三"],
        "Kanzaki Ryūji": ["神崎", "隆二"],
        "Katsuragi Kōhei": ["葛城", "康平"],
        "Kiriyama Ikuto": ["桐山", "生叶"],
        "Kitō Hayato": ["鬼頭", "隼"],
        "Komiya Kyōgo": ["小宮", "叶吾"],
        "Kondō Reo": ["近藤", "玲音"],
        "Kōenji Rokusuke": ["高円寺", "六助"],
        "Kōji Machida": ["浩二", "町田"],
        "Kusuda Yukitsu": ["楠田", "ゆきつ"],
        "Mashima Tomonari": ["真嶋", "智也"],
        "Miyake Akito": ["三宅", "明人"],
        "Miyamoto Sōshi": ["宮本", "蒼士"],
        "Nagumo Miyabi": ["南雲", "雅"],
        "Naoe Jinnosuke": ["直江", "仁之助"],
        "Norihito Watanabe": ["渡辺", "紀仁"],
        "Okitani Kyōsuke": ["沖谷", "京介"],
        "Ryūen Kakeru": ["龍園", "翔"],
        "Sakagami Kazuma": ["坂上", "数馬"],
        "Sakayanagi Narimori": ["坂柳", "成守"],
        "Sanada Kousei": ["真田", "康生"],
        "Shiba Katsunori": ["司馬", "克典"],
        "Shibata Sō": ["柴田", "颯"],
        "Sotomura Hideo": ["外村", "秀雄"],
        "Sudō Ken": ["須藤", "健"],
        "Suzukake Tanji": ["鈴懸", "鍛治"],
        "Tachibana Kento": ["立花", "賢人"],
        "Takahashi Osamu": ["高橋", "修"],
        "Tokitō Hiroya": ["時任", "裕也"],
        "Totsuka Yahiko": ["戸塚", "弥彦"],
        "Tsukishiro Tokinari": ["月城", "常成"],
        "Utomiya Riku": ["宇都宮", "陸"],
        "Yagami Takuya": ["八神", "拓也"],
        "Yamada Albert": ["山田", "アルベルト"],
        "Yamauchi Haruki": ["山内", "春樹"],
        "Yanagi Yasuhisa": ["柳", "安久"],
        "Yukimura Teruhiko": ["幸村", "輝彦"]
    },
    "Female": {
        "Akiyama": ["秋山"],
        "Isoyama": ["磯山"],
        "Mii": ["みー"],
        "Mika": ["美香"],
        "Minamikawa": ["南川"],
        "Amasawa Ichika": ["天沢", "一夏"],
        "Amikura Mako": ["網倉", "麻子"],
        "Andō Sayo": ["安藤", "紗代"],
        "Asahina Nazuna": ["朝比奈", "なずな"],
        "Azuma Sana": ["東", "咲菜"],
        "Chabashira Sae": ["茶柱", "佐枝"],
        "Enoshima Midoriko": ["榎嶋", "翠子"],
        "Hasebe Haruka": ["長谷部", "波瑠加"],
        "Himeno Yuki": ["姫野", "ユキ"],
        "Horikita Suzune": ["堀北", "鈴音"],
        "Hoshinomiya Chie": ["星之宮", "知恵"],
        "Ibuki Mio": ["伊吹", "澪"],
        "Ichinose Honami": ["一之瀬", "帆波"],
        "Inogashira Kokoro": ["井の頭", "心"],
        "Kamuro Masumi": ["神室", "真澄"],
        "Karuizawa Kei": ["軽井沢", "恵"],
        "Kikyō Kushida": ["桔梗", "櫛田"],
        "Kinoshita Minori": ["木下", "美野里"],
        "Kiryūin Fūka": ["鬼龍院", "楓花"],
        "Kobashi Yume": ["小橋", "夢"],
        "Manabe Shiho": ["真鍋", "志保"],
        "Matsushita Chiaki": ["松下", "千秋"],
        "Mori Nene": ["森", "寧々"],
        "Morishita Ai": ["森下", "藍"],
        "Nanase Tsubasa": ["七瀬", "翼"],
        "Nishino Takeko": ["西野", "武子"],
        "Onodera Kayano": ["小野寺", "かや乃"],
        "Sakayanagi Arisu": ["坂柳", "有栖"],
        "Sakura Airi": ["佐倉", "愛里"],
        "Satō Maya": ["佐藤", "麻耶"],
        "Shiina Hiyori": ["椎名", "ひより"],
        "Shinohara Satsuki": ["篠原", "さつき"],
        "Shiranami Chihiro": ["白波", "千尋"],
        "Suchi Moeka": ["須知", "萌香"],
        "Tachibana Akane": ["橘", "茜"],
        "Tsubaki Sakurako": ["椿", "桜子"],
        "Wan Mei-Yui": ["王", "美雨"],
        "Yabu Nanami": ["藪", "菜々美"],
        "Yamamura Miki": ["山村", "美紀"],
        "Yamanaka Ikuko": ["山中", "郁子"],
        "Yamashita Saki": ["鈴代", "紗弓"]
    },
    "Unknown": {
        "Anzai": ["安在"],
        "Jima": ["島"],
        "Kosumi": ["小角"],
        "Midora": ["美空"],
        "Namekawa": ["滑川"],
        "Obokata": ["小保方"],
        "Ryūko": ["竜子"],
        "Yano": ["矢野"],
        "king": ["Wan-sama"],
        "Eikura Mami": ["榮倉", "まみ"],
        "Fukuchi Hinano": ["福地陽", "菜乃"],
        "Hagiwara Chihaya": ["萩原", "千颯"],
        "Hatsukawa Maho": ["初川", "舞峰"],
        "Iguchi Yuri": ["井口", "由里"],
        "Nishimura Ryūko": ["西村", "龍子"],
        "Sawada Yasumi": ["沢田", "恭美"],
        "Shintoku Tarō": ["新徳", "太郎"],
        "Tatewaki Aoi": ["帯刀", "碧"],
        "Tōdō Rin": ["藤堂", "凛"],
        "Yamashita Naohisa": ["山下", "直久"]
    }
}
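A rough sketch of how a genders.json like the one above can be queried (Kudasai's actual matching, with honorific stripping and partial-name checks, lives in modules/common/gender_util.py; the path and lookup below are illustrative):

```python
import json

## assumes the demo file above is on disk at this relative path
with open("demo/genders.json", encoding="utf-8") as file:
    genders = json.load(file)

def gender_of(name: str) -> str:
    ## exact-key lookup only; the real util also matches partial names
    for gender, names in genders.items():
        if(name in names):
            return gender
    return "Undetermined"

print(gender_of("Horikita Suzune"))  ## -> Female
```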
demo/translation_settings.json
CHANGED
@@ -6,13 +6,15 @@
 "je_check_mode": 2,
 "number_of_malformed_batch_retries": 1,
 "batch_retry_timeout": 700,
-"number_of_concurrent_batches": 2
+"number_of_concurrent_batches": 2,
+"gender_context_insertion": true,
+"is_cote": true
 },
 
 "openai settings": {
-"openai_model": "gpt-…
-"openai_system_message": "As a Japanese to English translator, translate narration into…
-"openai_temperature": 0.…
+"openai_model": "gpt-4-turbo",
+"openai_system_message": "As a Japanese to English translator, translate narration into simple past tense, everything else should remain in its original tense. Maintain original formatting, spacing, punctuation, and paragraph structure. Keep pre-translated terms and anticipate names not replaced. Calls and text messages should be enclosed in brackets. Preserve terms and markers marked with >>><<< and match the output's line count to the input's. Note: 〇 indicates chapter changes.",
+"openai_temperature": 0.1,
 "openai_top_p": 1.0,
 "openai_n": 1,
 "openai_stream": false,
@@ -24,9 +26,9 @@
 },
 
 "gemini settings": {
-"gemini_model": "gemini-…
-"gemini_prompt": "As a Japanese to English translator, translate narration into…
-"gemini_temperature": 0.…
+"gemini_model": "gemini-pro",
+"gemini_prompt": "As a Japanese to English translator, translate narration into simple past tense, everything else should remain in its original tense. Maintain original formatting, spacing, punctuation, and paragraph structure. Keep pre-translated terms and anticipate names not replaced. Calls and text messages should be enclosed in brackets. Preserve terms and markers marked with >>><<< and match the output's line count to the input's. Note: 〇 indicates chapter changes.",
+"gemini_temperature": 0.1,
 "gemini_top_p": null,
 "gemini_top_k": null,
 "gemini_candidate_count": 1,
handlers/json_handler.py
CHANGED
@@ -43,7 +43,9 @@ class JsonHandler:
     "je_check_mode",
     "number_of_malformed_batch_retries",
     "batch_retry_timeout",
-    "number_of_concurrent_batches"
+    "number_of_concurrent_batches",
+    "gender_context_insertion",
+    "is_cote"
 ]
 
 openai_keys = [
@@ -86,6 +88,8 @@ class JsonHandler:
     "je_check_mode": lambda x: isinstance(x, int) and 1 <= x <= 2,
     "number_of_malformed_batch_retries": lambda x: isinstance(x, int) and x >= 0,
     "batch_retry_timeout": lambda x: isinstance(x, int) and x >= 0,
+    "gender_context_insertion": lambda x: isinstance(x, bool),
+    "is_cote": lambda x: isinstance(x, bool),
     "number_of_concurrent_batches": lambda x: isinstance(x, int) and x >= 0,
     "openai_model": lambda x: isinstance(x, str) and x in ALLOWED_OPENAI_MODELS,
     "openai_system_message": lambda x: x not in ["", "None", None],
@@ -326,6 +330,8 @@ class JsonHandler:
     "number_of_malformed_batch_retries": {"type": int, "constraints": lambda x: x >= 0},
     "batch_retry_timeout": {"type": int, "constraints": lambda x: x >= 0},
     "number_of_concurrent_batches": {"type": int, "constraints": lambda x: x >= 0},
+    "gender_context_insertion": {"type": bool, "constraints": lambda x: isinstance(x, bool)},
+    "is_cote": {"type": bool, "constraints": lambda x: isinstance(x, bool)},
     "openai_model": {"type": str, "constraints": lambda x: x in ALLOWED_OPENAI_MODELS},
     "openai_system_message": {"type": str, "constraints": lambda x: x not in ["", "None", None]},
     "openai_temperature": {"type": float, "constraints": lambda x: 0 <= x <= 2},
@@ -412,26 +418,14 @@ class SettingsChanger:
     menu = """
 Current settings:
 ----------------------------------------------------------------
-
     """
 
-        for key,value in JsonHandler.current_translation_settings["base translation settings"].items():
-            menu += key + " : " + str(value) + "\n"
-
-        print("\n")
-
-        for key,value in JsonHandler.current_translation_settings["openai settings"].items():
-            menu += key + " : " + str(value) + "\n"
-
-        print("\n")
-
-        for key,value in JsonHandler.current_translation_settings["gemini settings"].items():
-            menu += key + " : " + str(value) + "\n"
-
-        print("\n")
 
-        for …
-
+        settings = ["base translation settings", "openai settings", "gemini settings", "deepl settings"]
 
+        for setting in settings:
+            for key, value in JsonHandler.current_translation_settings[setting].items():
+                menu += key + " : " + str(value) + "\n"
+            menu += "\n"
 
     menu += """
 It is recommended that you maximize the console window for this. You will have to to see the settings above.
jsons/cote_replacements.json
CHANGED
@@ -87,7 +87,7 @@
 "Mika": ["美香"],
 "Minamikawa": ["南川"],
 "Namekawa": ["滑川"],
-"…
+"Ōba": ["大場"],
 "Obokata": ["小保方"],
 "Onizuka": ["鬼塚"],
 "Ryūko": ["竜子"],
@@ -103,7 +103,6 @@
 "king": ["Wan-sama"]
 },
 
-
 "full_names": {
 "Amasawa Ichika": ["天沢","一夏"],
 "Amikura Mako": ["網倉","麻子"],
@@ -209,7 +208,8 @@
 },
 
 "enhanced_check_whitelist": {
-"Hoshinomiya Chie": ["星之宮","知恵"]
+"Hoshinomiya Chie": ["星之宮","知恵"],
+"Kijima": ["鬼島"]
 }
 
 }
lib/common/translation_settings_description.txt
CHANGED
@@ -14,6 +14,10 @@ number_of_malformed_batch_retries : (A malformed batch is when je-fixing fails) Ho…
 batch_retry_timeout : How long Kudasai will try to translate a batch, in seconds. If a request exceeds this duration, Kudasai will leave it untranslated.
 
 number_of_concurrent_batches : How many translation batches Kudasai will send to the translation API at a time. For OpenAI, be conservative as rate-limiting is aggressive; I'd suggest 3-5. For Gemini, do not exceed 15 for 1.0 or 2 for 1.5. This setting more or less doesn't matter for DeepL.
+
+gender_context_insertion : true or false - Whether to insert gender info into system prompts when translating text. Kudasai will look for a "genders.json" (exactly) in the root directory and scan each text to translate for the names in that file. If a name is found, Kudasai will insert the gender info into the system prompt. For more info, see the README.md.
+
+is_cote : true or false - Whether you are translating COTE (Classroom of the Elite). Kudasai has specialized functions for COTE that will be enabled if this is set to true.
 ----------------------------------------------------------------------------------
 Open AI Settings:
 See https://platform.openai.com/docs/api-reference/chat/create for further details
lib/gui/HUGGING_FACE_README.md
CHANGED
@@ -113,6 +113,11 @@ For further details on the settings file, see [here](#translation-with-llms-settings)
 batch_retry_timeout : How long Kudasai will try to translate a batch, in seconds. If a request exceeds this duration, Kudasai will leave it untranslated.
 
 number_of_concurrent_batches : How many translation batches Kudasai will send to the translation API at a time. For OpenAI, be conservative as rate-limiting is aggressive; I'd suggest 3-5. For Gemini, do not exceed 15 for 1.0 or 2 for 1.5. This setting more or less doesn't matter for DeepL.
+
+gender_context_insertion : true or false - Whether to insert gender info into system prompts when translating text. Kudasai will look for a "genders.json" (exactly) in the root directory and scan each text to translate for the names in that file. If a name is found, Kudasai will insert the gender info into the system prompt. For more info, see the README.md.
+
+is_cote : true or false - Whether you are translating COTE (Classroom of the Elite). Kudasai has specialized functions for COTE that will be enabled if this is set to true.
+
 ----------------------------------------------------------------------------------
 Open AI Settings:
 See https://platform.openai.com/docs/api-reference/chat/create for further details
lib/gui/save_to_file.js
CHANGED
@@ -1,4 +1,5 @@
-(text) =>
+(text) =>
+{
     const blob = new Blob([text], { type: 'text/plain;charset=utf-8' });
     const url = URL.createObjectURL(blob);
     const a = document.createElement('a');
modules/common/file_ensurer.py
CHANGED
@@ -58,6 +58,9 @@ class FileEnsurer():
     ## translation settings
     external_translation_settings_path = os.path.join(script_dir,'translation_settings.json')
     config_translation_settings_path = os.path.join(config_dir,'translation_settings.json')
+
+    external_translation_genders_path = os.path.join(script_dir,'genders.json')
+    config_translation_genders_path = os.path.join(config_dir, 'genders.json')
 
     ## api keys
     deepl_api_key_path = os.path.join(secrets_dir, "deepl_api_key.txt")
@@ -85,7 +88,9 @@ class FileEnsurer():
     "je_check_mode": 2,
     "number_of_malformed_batch_retries": 1,
     "batch_retry_timeout": 300,
-    "number_of_concurrent_batches": 5
+    "number_of_concurrent_batches": 5,
+    "gender_context_insertion": False,
+    "is_cote": False,
 },
 
 "openai settings": {
@@ -121,6 +126,13 @@ class FileEnsurer():
         "deepl_formality": "default"
     }
 }
+
+DEFAULT_GENDER_SETTINGS = {
+    "Male": {},
+    "Female": {},
+    "Unknown": {}
+}
+
 INVALID_TRANSLATION_SETTINGS_PLACEHOLDER = {
     "INVALID JSON":
     {
@@ -128,6 +140,13 @@ class FileEnsurer():
     }
 }
 
+INVALID_GENDER_SETTINGS_PLACEHOLDER = {
+    "INVALID JSON":
+    {
+        "INVALID JSON":"INVALID JSON"
+    }
+}
+
 ## rules
 blank_rules_path = os.path.join(jsons_dir, "blank_replacements.json")
 
@@ -200,6 +219,11 @@ class FileEnsurer():
         with open(FileEnsurer.config_translation_settings_path, 'w+', encoding='utf-8') as file:
             json.dump(FileEnsurer.DEFAULT_TRANSLATION_SETTING, file)
 
+        ## creates the genders file if it doesn't exist
+        if(os.path.exists(FileEnsurer.config_translation_genders_path) == False):
+            with open(FileEnsurer.config_translation_genders_path, 'w+', encoding='utf-8') as file:
+                json.dump(FileEnsurer.DEFAULT_GENDER_SETTINGS, file)
+
 ##-------------------start-of-purge_storage()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
 
 @staticmethod
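The genders bootstrap above follows the same idempotent pattern as the settings file: write the default only when the config copy is missing, so user edits survive repeated startups. A minimal standalone sketch of that pattern (the path and default below are illustrative, not Kudasai's real config paths):

```python
import json
import os

def ensure_json(path: str, default: dict) -> None:
    ## write the default only if the file does not already exist
    if(not os.path.exists(path)):
        with open(path, 'w+', encoding='utf-8') as file:
            json.dump(default, file)

ensure_json("genders.json", {"Male": {}, "Female": {}, "Unknown": {}})
```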
modules/common/gender_util.py
ADDED
@@ -0,0 +1,420 @@
## built-in libraries
import json
import typing

## third-party libraries
import regex

## custom modules
from modules.common.file_ensurer import FileEnsurer

##-------------------start-of-GenderUtil---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

class GenderUtil:

    genders:typing.Optional[dict] = None
    cache = {}

    is_cote:bool = False

    ##-------------------start-of-find_english_words()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def find_english_words(text:str) -> list[tuple[str, int]]:

        """

        Finds the English words in the text.

        Parameters:
        text (str) : The text to be searched.

        Returns:
        (list[tuple[str, int]]) : The list of words and their starting indices.

        """

        return [(match.group(), match.start()) for match in regex.finditer(r'\p{Latin}+', text)]

    ##-------------------start-of-is_potential_name()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def is_potential_name(word:str) -> bool:

        """

        Treats words as potential names, excluding any word that contains full-width characters (U+FF00-U+FFEF).

        Parameters:
        word (str) : The word to be checked.

        Returns:
        (bool) : The result of the check.

        """

        return not any(0xFF00 <= ord(ch) <= 0xFFEF for ch in word)

    ##-------------------start-of-group_names()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def group_names(text, names_with_positions: list[tuple[str, int]], max_distance: int = 10) -> list[str]:

        """

        Groups names together if they follow one another within a certain distance and are separated by spaces.

        Parameters:
        text (str) : The text to be searched.
        names_with_positions (list[tuple[str, int]]) : The names with their positions.
        max_distance (int) : The maximum distance between names.

        Returns:
        (list[str]) : The grouped names.

        """

        honorifics = [
            "chan",
            "dono",
            "kun",
            "kōhai",
            "paisen",
            "sama",
            "san",
            "senpai",
            "sensei",
            "shi",
            "ue"
        ]

        blacklist = [
            "contents",
        ]

        grouped_names = []
        i = 0
        skip_next = False
        length = len(names_with_positions)

        while i < length - 1:

            if(skip_next):
                skip_next = False

            else:
                current_name, current_pos = names_with_positions[i]
                next_name, next_pos = names_with_positions[i + 1]

                if(current_name in blacklist):
                    i += 1
                    continue

                ## Check if names are separated by spaces and are within the maximum distance.
                separator = text[current_pos + len(current_name):next_pos]

                if(GenderUtil.is_potential_name(next_name) and (separator.isspace()) and next_pos - current_pos <= max_distance):
                    grouped_names.append(current_name + " " + next_name)
                    skip_next = True
                else:
                    grouped_names.append(current_name)

            i += 1

        if(not skip_next and names_with_positions):
            grouped_names.append(names_with_positions[-1][0])

        ## merge honorifics with names
        for i, name in enumerate(grouped_names):
            if(i + 1 < len(grouped_names) and grouped_names[i + 1].lower() in honorifics):
                grouped_names[i] += "-" + grouped_names[i + 1]
                grouped_names.pop(i + 1)

        return grouped_names

    ##-------------------start-of-load_genders()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def load_genders() -> dict:

        """

        Loads the genders from the config genders.json file and clears the cache.

        Returns:
        (dict) : The loaded json.

        """

        GenderUtil.cache = {}

        with open(FileEnsurer.config_translation_genders_path, 'r', encoding='utf-8') as file:
            return json.load(file)

    ##-------------------start-of-discard_non_names()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def discard_non_names(names: list[str]) -> list[str]:

        """

        Discards any names that are not in the gender list.

        Parameters:
        names (list[str]) : The names to be filtered.

        Returns:
        new_names (list[str]) : The filtered names.

        """

        GenderUtil.genders = GenderUtil.load_genders()

        new_names = [
            name for name in names
            if any(
                any(
                    part == full_part
                    for part in GenderUtil.honorific_stripper(name).split(' ')
                    for full_part in full_name.split(' ')
                )
                for gender, gender_names in GenderUtil.genders.items()
                for full_name, _ in gender_names.items()
            )
        ]

        if(GenderUtil.is_cote):
            ## known issues with cote
            new_names = [name for name in new_names if name not in ["king"] and len(name) > 1]

        return new_names

    ##-------------------start-of-honorific_stripper()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def honorific_stripper(name:str) -> str:

        """

        Strips the honorific from the name.

        Parameters:
        name (str) : The name to be stripped.

        Returns:
        (str) : The stripped name.

        """

        if("-" in name):
            return name.split("-")[0]

        return name

    ##-------------------start-of-reverse_honorific_stripper()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def reverse_honorific_stripper(name:str) -> str:

        """

        Removes the name from the honorific. (Gets the honorific.)

        Parameters:
        name (str) : The name to be stripped.

        Returns:
        (str) : The honorific, or an empty string if there is none.

        """

        if("-" in name):
            return name.split("-")[1]

        return ""

    ##-------------------start-of-discard_similar_names()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def discard_similar_names(names: list[str]) -> list[str]:

        """

        Discards any names that are similar to each other.

        This totally didn't take me literally 2 hours because I'm a dipshit who overcomplicates things.

        Parameters:
        names (list[str]) : The names to be filtered.

        Returns:
        (list[str]) : The filtered names.

        """

        seen = set()
        result = []

        ## Sort names by length (shortest first)
        names.sort(key=len)

        for name in names:
            base_name = GenderUtil.honorific_stripper(name)
            if(not any(base_name in seen_name or seen_name in base_name for seen_name in seen)):
                result.append(name)
                seen.add(base_name)

        return result

    ##-------------------start-of-find_name_gender()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def find_name_gender(name:str) -> list[str]:

        """

        Finds the gender associated with a name.

        Parameters:
        name (str) : The name to look up.

        Returns:
        result (list[str]) : The gender(s) matched for the name.

        """

        ## known names that are literally 95% this
        cote_predetermined: typing.Dict[typing.Tuple[str, str], str] = {
            ("Sakayanagi", "san"): "Female",
            ("Horikita", "san"): "Female",
            ("Horikita", ""): "Female",
            ("Sakayanagi", ""): "Female",
            ("Sakayanagi", "sama"): "Male",
            ("Sakayanagi", "sensei"): "Male",
            ("Kei", ""): "Female"
        }

        GenderUtil.genders = GenderUtil.load_genders()

        if(name in GenderUtil.cache):
            return GenderUtil.cache[name]

        honorific = GenderUtil.reverse_honorific_stripper(name)
        stripped_name = GenderUtil.honorific_stripper(name)

        ## check if the name is predetermined
        if((stripped_name, honorific) in cote_predetermined and GenderUtil.is_cote):
            result = [cote_predetermined[(stripped_name, honorific)]]
            GenderUtil.cache[name] = result
            return result

        ## this does an in operation
        ## so it could return too many (Kei, for instance, will trigger Keisei and Kei)
        result = [gender for gender, names in GenderUtil.genders.items() for full_name in names if stripped_name in full_name]

        ## so we go through it again, split the full name into first and last name, compare them to the stripped name, and set the result
        if(len(result) > 1):
            for gender, names in GenderUtil.genders.items():
                for full_name in names:
                    first_name = full_name.split(" ")[0]
                    last_name = full_name.split(" ")[-1]

                    if((first_name == stripped_name or last_name == stripped_name) and gender in result):
                        ## need to re-add; done because this can match for multiple genders
                        result.remove(gender)
                        result.append(gender)

        if(len(set(result)) > 1 or result in ["Undetermined", "Unknown"]):
            if(honorific == "kun"):
                result = ["Male"]
            elif(honorific == "chan"):
                result = ["Female"]

            else:
                result = ["Undetermined"]

        GenderUtil.cache[name] = result

        return result

    ##-------------------start-of-get_pronoun_assumption_for_system_prompt()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def get_pronoun_assumption_for_system_prompt(sample:str) -> typing.List[str]:

        """

        Gets the pronoun assumptions for a text sample so they can be used in the system prompt.

        Parameters:
        sample (str) : The text to be analyzed.

        Returns:
        pronoun_assumptions (list[str]) : The pronoun assumptions.

        """

        gender_to_pronoun_map = {
            "Male": "he",
            "Female": "she",
            ## we used Unknown in the json file, but we should use Undetermined (and no, I'm not changing the json file)
            "Undetermined": "they",
            "Unknown": "they"
        }

        names_with_positions = GenderUtil.find_english_words(sample)
        potential_names_with_positions = [(name, pos) for name, pos in names_with_positions if GenderUtil.is_potential_name(name)]
        grouped_names = GenderUtil.group_names(sample, potential_names_with_positions)
        actual_names = GenderUtil.discard_non_names(grouped_names)
        filtered_names = GenderUtil.discard_similar_names(actual_names)

        assumptions = [
            "{} : {}\n".format(name, gender[0]) if gender and len(set(gender)) == 1 and gender not in ["Undetermined", "Unknown"] else "{} : Undetermined\n".format(name)
            for name in filtered_names
            for gender in [GenderUtil.find_name_gender(name)]
        ]

        pronoun_assumptions = [
            "{} : {}\n".format(name.strip(), gender_to_pronoun_map.get(gender.strip(), "they"))
            for assumption in assumptions
            for name, gender in [assumption.split(":")]
        ]

        return pronoun_assumptions

    ##----------------start-of-get_gender_assumption_for_system_prompt()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------

    @staticmethod
    def get_gender_assumption_for_system_prompt(sample:str) -> typing.List[str]:

        """

        Gets the gender assumptions for a text sample.

        Parameters:
        sample (str) : The text to be analyzed.

        Returns:
        gender_assumptions (list[str]) : The gender assumptions.

        """

        names_with_positions = GenderUtil.find_english_words(sample)
        potential_names_with_positions = [(name, pos) for name, pos in names_with_positions if GenderUtil.is_potential_name(name)]
        grouped_names = GenderUtil.group_names(sample, potential_names_with_positions)
        actual_names = GenderUtil.discard_non_names(grouped_names)
        filtered_names = GenderUtil.discard_similar_names(actual_names)

        assumptions = [
            "{} : {}\n".format(name, gender[0]) if gender and len(set(gender)) == 1 and gender not in ["Undetermined", "Unknown"] else "{} : Undetermined\n".format(name)
            for name in filtered_names
            for gender in [GenderUtil.find_name_gender(name)]
        ]

        gender_assumptions = [
            "{} : {}\n".format(name.strip(), gender.strip().replace("Unknown", "Undetermined"))
            for assumption in assumptions
            for name, gender in [assumption.split(":")]
        ]

        return gender_assumptions
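A usage sketch for the pipeline above (it assumes a populated genders.json already exists at FileEnsurer.config_translation_genders_path; the sample text is made up):

```python
from modules.common.gender_util import GenderUtil

GenderUtil.is_cote = True  ## enables the COTE-specific overrides shown above

sample = "Horikita-san was speaking with Ayanokōji Kiyotaka."
assumptions = GenderUtil.get_gender_assumption_for_system_prompt(sample)

## prints something like "Horikita : Female" and "Ayanokōji Kiyotaka : Male"
print("".join(assumptions))
```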
modules/common/toolkit.py
CHANGED
@@ -15,7 +15,7 @@ class Toolkit():
 
     """
 
-    CURRENT_VERSION = "v3.4.…
+    CURRENT_VERSION = "v3.4.9-beta"
 
     ##-------------------start-of-clear_console()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
modules/common/translator.py
CHANGED
@@ -2,6 +2,7 @@
 import typing
 import base64
 import re
+import shutil
 import time
 import typing
 import asyncio
@@ -21,6 +22,7 @@ from modules.common.file_ensurer import FileEnsurer
 from modules.common.toolkit import Toolkit
 from modules.common.exceptions import OpenAIAuthenticationError, MaxBatchDurationExceededException, DeepLAuthorizationException, OpenAIInternalServerError, OpenAIRateLimitError, OpenAIAPITimeoutError, GoogleAuthError, OpenAIAPIStatusError, OpenAIAPIConnectionError, DeepLException, GoogleAPIError
 from modules.common.decorators import permission_error_decorator
+from modules.common.gender_util import GenderUtil
 
 ##-------------------start-of-Translator--------------------------------------------------------------------------------------------------------------------------------------------------------------------------
 
@@ -74,6 +76,8 @@ class Translator:
     number_of_malformed_batch_retries:int
     batch_retry_timeout:float
     num_concurrent_batches:int
+    gender_context_insertion:bool
+    is_cote:bool
 
     decorator_to_use:typing.Callable
 
@@ -432,6 +436,15 @@
 
     """
 
+    if(os.path.exists(FileEnsurer.external_translation_genders_path) and not is_webgui):
+        logging.info("External genders.json file found, overriding config...")
+        shutil.copy2(FileEnsurer.external_translation_genders_path, FileEnsurer.config_translation_genders_path)
+
+    if(not os.path.exists(FileEnsurer.external_translation_settings_path) and not is_webgui):
+        logging.info("External translation_settings.json file not found, using config...")
+        print("External translation_settings.json file not found, using config...")
+        time.sleep(2)
+
     logging.debug(f"Translator Activated, Translation Method : {Translator.TRANSLATION_METHOD} "
                   f"Settings are as follows : ")
 
@@ -444,6 +457,10 @@
     Translator.num_of_malform_retries = int(JsonHandler.current_translation_settings["base translation settings"]["number_of_malformed_batch_retries"])
     Translator.max_batch_duration = float(JsonHandler.current_translation_settings["base translation settings"]["batch_retry_timeout"])
     Translator.num_concurrent_batches = int(JsonHandler.current_translation_settings["base translation settings"]["number_of_concurrent_batches"])
+    Translator.gender_context_insertion = bool(JsonHandler.current_translation_settings["base translation settings"]["gender_context_insertion"])
+    Translator.is_cote = bool(JsonHandler.current_translation_settings["base translation settings"]["is_cote"])
+
+    GenderUtil.is_cote = Translator.is_cote
 
     Translator._semaphore = asyncio.Semaphore(Translator.num_concurrent_batches)
 
@@ -552,36 +569,39 @@
     """
 
     async_requests = []
+    logging_message = "Built Messages: \n\n"
 
     translation_batches_methods = {
-        "openai": Translator.openai_translation_batches,
-        "gemini": Translator.gemini_translation_batches,
-        "deepl": Translator.deepl_translation_batches,
-        "google translate": Translator.google_translate_translation_batches
+        method_name: getattr(Translator, f"{method_name}_translation_batches" if method_name != "google translate" else "google_translate_translation_batches")
+        for method_name in ["openai", "gemini", "deepl", "google translate"]
     }
 
     translation_batches = translation_batches_methods[Translator.TRANSLATION_METHOD]
     batch_length = len(translation_batches)
-    batch_number = 1 # Initialize batch number
 
+    ## if openai/gemini, which are LLMs, the batches come in instructions/prompt pairs
     if(Translator.TRANSLATION_METHOD not in ["deepl", "google translate"]):
-        for i in range(0, batch_length, 2):
-            instructions = translation_batches[i]
-            prompt = translation_batches[i + 1]
-
+        for batch_number, (instructions, prompt) in enumerate(zip(translation_batches[::2], translation_batches[1::2]), start=1):
             assert isinstance(instructions, (SystemTranslationMessage, str))
             assert isinstance(prompt, (ModelTranslationMessage, str))
 
-            …
+            if(Translator.gender_context_insertion):
+                assumption = list(set(GenderUtil.get_gender_assumption_for_system_prompt(prompt if isinstance(prompt, str) else prompt.content)))
+                assumption_string = "Additional Information:\nCharacter Genders:\n" + "".join(assumption) if len(assumption) > 0 else ""
+                instructions = SystemTranslationMessage(content=f"{instructions.content if isinstance(instructions, Message) else instructions}\n{assumption_string}")
 
+            logging_message += f"\n------------------------\n{instructions.content if isinstance(instructions, Message) else instructions}\n{prompt if isinstance(prompt, str) else prompt.content}"
+            async_requests.append(Translator.handle_translation(model, batch_number, batch_length//2, prompt, instructions))
+
+    ## if deepl/google translate, the batches are just the text
     else:
-        for batch in translation_batches:
+        for batch_number, batch in enumerate(translation_batches, start=1):
             assert isinstance(batch, str)
+            logging_message += f"\n------------------------\n{batch}"
             async_requests.append(Translator.handle_translation(model, batch_number, batch_length, batch, None))
-            batch_number += 1
 
+    logging.debug(logging_message)
+
     return async_requests
 
 ##-------------------start-of-generate_text_to_translate_batches()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
@@ -675,32 +695,6 @@
     elif(Translator.TRANSLATION_METHOD == 'google translate'):
         Translator.google_translate_translation_batches.append(batch)
 
-    logging_message = "Built Messages: \n\n"
-
-    batches_to_iterate = {
-        "openai": Translator.openai_translation_batches,
-        "gemini": Translator.gemini_translation_batches,
-        "deepl": Translator.deepl_translation_batches,
-        "google translate": Translator.google_translate_translation_batches
-    }
-
-    i = 0
-
-    batches = batches_to_iterate[Translator.TRANSLATION_METHOD]
-
-    for message in batches:
-
-        i+=1
-
-        message = str(message) if Translator.TRANSLATION_METHOD != 'openai' else message.content # type: ignore
-
-        if(i % 2 == 1 and Translator.TRANSLATION_METHOD not in ['deepl', 'google_translate']):
-            logging_message += "\n" "------------------------" "\n"
-
-        logging_message += message + "\n"
-
-    logging.debug(logging_message)
-
 ##-------------------start-of-handle_cost_estimate_prompt()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
 
 @staticmethod
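The refactored loop above pairs a flat [system, user, system, user, ...] list back into (instructions, prompt) tuples. A standalone sketch of the idiom, with made-up data:

```python
## zip over two offset slices: even indices are system messages, odd are prompts
batches = ["sys 1", "user 1", "sys 2", "user 2"]

for batch_number, (instructions, prompt) in enumerate(zip(batches[::2], batches[1::2]), start=1):
    print(batch_number, instructions, prompt)

## 1 sys 1 user 1
## 2 sys 2 user 2
```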
modules/gui/gui_json_util.py
CHANGED
@@ -56,7 +56,8 @@ class GuiJsonUtil:
 
     for header in new_rules.keys():
         for key, value in new_values:
-            new_rules[header]…
+            if(key in new_rules[header]):
+                new_rules[header][key] = JsonHandler.convert_to_correct_type(key, str(value))
 
     JsonHandler.current_translation_settings = new_rules
     JsonHandler.validate_json()
requirements.txt
CHANGED
@@ -1,5 +1,5 @@
 backoff==2.2.1
 gradio==4.20.0
-kairyou==1.6.…
-easytl==0.4.…
+kairyou==1.6.5
+easytl==0.4.3
 ja_core_news_lg @ https://github.com/explosion/spacy-models/releases/download/ja_core_news_lg-3.7.0/ja_core_news_lg-3.7.0-py3-none-any.whl#sha256=f08eecb4d40523045c9478ce59a67564fd71edd215f32c076fa91dc1f05cc7fd
util/token_counter.py
CHANGED
@@ -67,7 +67,7 @@ class TokenCounter:
     print("\nNote that the cost estimate is not always accurate, and may be higher than the actual cost. However cost calculation now includes output tokens.\n")
 
     if(self.service == "gemini"):
-        print(f"As of Kudasai {Toolkit.CURRENT_VERSION}, Gemini Pro 1.0 is free to use under…
+        print(f"As of Kudasai {Toolkit.CURRENT_VERSION}, Gemini Pro 1.0 is free to use under 15 requests per minute, Gemini Pro 1.5 is free to use under 2 requests per minute.\nIt is up to you to set these in the settings json.\nIt is currently unknown whether the ultra model parameter is connecting to the actual ultra model and not a pro one. As it works, but does not appear on any documentation.\n")
 
     print("Estimated number of tokens : " + str(num_tokens))
     print("Estimated minimum cost : " + str(min_cost) + " USD")
webgui.py
CHANGED
@@ -3,6 +3,7 @@ import typing
3 |   import base64
4 |   import asyncio
5 |   import os
6 |
7 |   ## third-party libraries
8 |   import gradio as gr
@@ -55,35 +56,37 @@ class KudasaiGUI:
55 |   "number_of_malformed_batch_retries": lines[12-1].strip(),
56 |   "batch_retry_timeout": lines[14-1].strip(),
57 |   "number_of_concurrent_batches": lines[16-1].strip(),
58-86 | - (the remaining "openai_*", "gemini_*", and "deepl_*" description entries, truncated in the page rendering; the new block further down lists them in full)
87 |   }
88 |
89 |   ##-------------------start-of-build_gui()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
@@ -96,7 +99,7 @@ class KudasaiGUI:
96 |
97 |   """
98 |
99 | - with gr.Blocks(title="Kudasai") as self.gui:
100 |
101 |   ##-------------------start-of-Utility-Functions---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
102 |
@@ -259,30 +262,32 @@ class KudasaiGUI:
259 |   4: "number_of_malformed_batch_retries",
260 |   5: "batch_retry_timeout",
261 |   6: "number_of_concurrent_batches",
262-285 | - (entries 7: through 30:, truncated in the page rendering; the renumbered mapping in the new block further down lists them in full)
286 |   }
287 |
288 |   for index, setting in enumerate(translation_settings):
@@ -381,7 +386,8 @@ class KudasaiGUI:
381 |   with gr.Column():
382 |       self.input_txt_file_translator = gr.File(label='TXT file with Japanese Text', file_count='single', file_types=['.txt'], type='filepath', interactive=True)
383 |       self.input_text_translator = gr.Textbox(label='Japanese Text', placeholder='Use this or the text file input, if you provide both, Kudasai will use the file input.', lines=10, show_label=True, interactive=True, type='text')
384 | -     self.input_translation_rules_file = gr.File(value = FileEnsurer.config_translation_settings_path, label='Translation Settings File', file_count='single', file_types=['.json'], type='filepath')
385 |
386 |   with gr.Row():
387 |       self.llm_option_dropdown = gr.Dropdown(label='Translation Method', choices=["OpenAI", "Gemini", "DeepL", "Google Translate"], value="DeepL", show_label=True, interactive=True)
@@ -488,6 +494,20 @@ class KudasaiGUI:
488 |   interactive=True,
489 |   elem_id="number_of_concurrent_batches",
490 |   show_copy_button=True)
491 |
492 |   with gr.Column():
493 |
@@ -956,17 +976,14 @@ class KudasaiGUI:
956 |   JsonHandler.current_translation_settings = GuiJsonUtil.current_translation_settings
957 |
958 |   ## next, set the llm type
959-967 | - (the removed if/elif branches for the other translation methods, truncated in the page rendering)
968 | - elif(translation_method == "Google Translate"):
969 | -     Translator.TRANSLATION_METHOD = "google translate"
970 |
971 |   ## api key as well
972 |   await set_translator_api_key(api_key)
@@ -1131,7 +1148,7 @@ class KudasaiGUI:
1131 |
1132 |   ##-------------------start-of-clear_translator_tab()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1133 |
1134 | - def clear_translator_tab() -> typing.Tuple[None, str, gr.File, str, str, str]:
1135 |
1136 |   """
1137 |
@@ -1140,6 +1157,8 @@ class KudasaiGUI:
1140 |   Returns:
1141 |       input_txt_file_translator (gr.File) : An empty file.
1142 |       input_text_translator (str) : An empty string.
1143 |       translator_translated_text_output_field (str) : An empty string.
1144 |       je_check_text_field_translator (str) : An empty string.
1145 |       translator_debug_log_output_field (str) : An empty string.
@@ -1157,13 +1176,16 @@ class KudasaiGUI:
1157 |   input_text_translator = ""
1158 |
1159 |   ## Also gonna want to reset the json input field to the default json file
1160 | - input_translation_rules_file = gr.File(value = FileEnsurer.config_translation_settings_path, label='Translation Settings File', file_count='single', file_types=['.json'], type='filepath')
1161 |
1162 |   translator_translated_text_output_field = ""
1163 |   je_check_text_field_translator = ""
1164 |   translator_debug_log_output_field = ""
1165 |
1166 | - return input_file_translator, input_text_translator, input_translation_rules_file, translator_translated_text_output_field, je_check_text_field_translator, translator_debug_log_output_field
1167 |
1168 |   ##-------------------start-of-clear_log_button_click()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1169 |
@@ -1197,6 +1219,8 @@ class KudasaiGUI:
1197 |   num_malformed_batch_retries:int,
1198 |   batch_retry_timeout:int,
1199 |   num_concurrent_batches:int,
1200 |   openai_model:str,
1201 |   openai_system_message:str,
1202 |   openai_temperature:float,
@@ -1241,6 +1265,8 @@ class KudasaiGUI:
1241 |   num_malformed_batch_retries,
1242 |   batch_retry_timeout,
1243 |   num_concurrent_batches,
1244 |   openai_model,
1245 |   openai_system_message,
1246 |   openai_temperature,
@@ -1270,9 +1296,9 @@ class KudasaiGUI:
1270 |
1271 |   ## create the new key-value pair list
1272 |   new_key_value_tuple_pairs = create_new_key_value_tuple_pairs(settings_list)
1273 | -
1274 |   try:
1275 | -     ## and then have the GuiJsonUtil apply the new translator settings
1276 |       GuiJsonUtil.update_translation_settings_with_new_values(input_translation_rules_file, new_key_value_tuple_pairs)
1277 |
1278 |   except:
@@ -1303,6 +1329,8 @@ class KudasaiGUI:
1303 |   ("base translation settings", "number_of_malformed_batch_retries", str),
1304 |   ("base translation settings", "batch_retry_timeout", str),
1305 |   ("base translation settings", "number_of_concurrent_batches", str),
1306 |   ("openai settings", "openai_model", str),
1307 |   ("openai settings", "openai_system_message", str),
1308 |   ("openai settings", "openai_temperature", float),
@@ -1360,6 +1388,8 @@ class KudasaiGUI:
1360 |   ("base translation settings", "number_of_malformed_batch_retries", str),
1361 |   ("base translation settings", "batch_retry_timeout", str),
1362 |   ("base translation settings", "number_of_concurrent_batches", str),
1363 |   ("openai settings", "openai_model", str),
1364 |   ("openai settings", "openai_system_message", str),
1365 |   ("openai settings", "openai_temperature", float),
@@ -1393,6 +1423,51 @@ class KudasaiGUI:
1393 |   raise gr.Error("Invalid Custom Translation Settings File")
1394 |
1395 |   return return_batch
1396 |
1397 |   ##-------------------start-of-clear_translation_settings_input_fields()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1398 |
@@ -1414,6 +1489,8 @@ class KudasaiGUI:
1414 |   "num_malformed_batch_retries_value": None,
1415 |   "batch_retry_timeout_value": None,
1416 |   "num_concurrent_batches_value": None,
1417 |   "openai_model_value": None,
1418 |   "openai_system_message_value": None,
1419 |   "openai_temperature_value": None,
@@ -1566,8 +1643,6 @@ class KudasaiGUI:
1566 |   self.logging_tab_debug_log_output_field, ## debug log on log tab
1567 |   self.logging_tab_error_log_output_field]) ## error log on log tab
1568 |
1569 | -
1570 | -
1571 |   ##-------------------start-of-translate_with_translator()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1572 |
1573 |   ## for the actual translation, and the je check text
@@ -1592,7 +1667,6 @@ class KudasaiGUI:
1592 |
1593 |   every=.1) ## update every 100ms
1594 |
1595 | -
1596 |   ##-------------------start-of translator_calculate_costs_button_click()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1597 |
1598 |   self.translator_calculate_cost_button.click(translator_calculate_costs_button_click,
@@ -1641,6 +1715,7 @@ class KudasaiGUI:
1641 |   self.input_txt_file_translator, ## input txt file
1642 |   self.input_text_translator, ## input text
1643 |   self.input_translation_rules_file, ## Translation Settings File
1644 |   self.translator_translated_text_output_field, ## translation output field
1645 |   self.translator_je_check_text_output_field, ## je check text field on translator tab
1646 |   self.translator_debug_log_output_field], ## debug log on translator tab
@@ -1668,6 +1743,8 @@ class KudasaiGUI:
1668 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1669 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1670 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1671 |   self.openai_model_input_field, ## openai model input field
1672 |   self.openai_system_message_input_field, ## openai system message input field
1673 |   self.openai_temperature_input_field, ## openai temperature input field
@@ -1708,6 +1785,8 @@ class KudasaiGUI:
1708 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1709 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1710 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1711 |   self.openai_model_input_field, ## openai model input field
1712 |   self.openai_system_message_input_field, ## openai system message input field
1713 |   self.openai_temperature_input_field, ## openai temperature input field
@@ -1746,6 +1825,8 @@ class KudasaiGUI:
1746 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1747 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1748 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1749 |   self.openai_model_input_field, ## openai model input field
1750 |   self.openai_system_message_input_field, ## openai system message input field
1751 |   self.openai_temperature_input_field, ## openai temperature input field
@@ -1784,6 +1865,8 @@ class KudasaiGUI:
1784 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1785 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1786 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1787 |   self.openai_model_input_field, ## openai model input field
1788 |   self.openai_system_message_input_field, ## openai system message input field
1789 |   self.openai_temperature_input_field, ## openai temperature input field
@@ -1821,6 +1904,8 @@ class KudasaiGUI:
1821 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1822 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1823 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1824 |   self.openai_model_input_field, ## openai model input field
1825 |   self.openai_system_message_input_field, ## openai system message input field
1826 |   self.openai_temperature_input_field, ## openai temperature input field
@@ -1845,6 +1930,19 @@ class KudasaiGUI:
1845 |   self.deepl_split_sentences_input_field, ## deepl split sentences input field
1846 |   self.deepl_preserve_formatting_input_field, ## deepl preserve formatting input field
1847 |   self.deepl_formality_input_field]) ## deepl formality input field
1848 |
1849 |   ##-------------------start-of-logging_tab.select()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1850 |

3 |   import base64
4 |   import asyncio
5 |   import os
6 | + import json
7 |
8 |   ## third-party libraries
9 |   import gradio as gr
56 |   "number_of_malformed_batch_retries": lines[12-1].strip(),
57 |   "batch_retry_timeout": lines[14-1].strip(),
58 |   "number_of_concurrent_batches": lines[16-1].strip(),
59 | + "gender_context_insertion": lines[18-1].strip(),
60 | + "is_cote": lines[20-1].strip(),
61 | + "openai_help_link": lines[23-1].strip(),
62 | + "openai_model": lines[25-1].strip(),
63 | + "openai_system_message": lines[27-1].strip(),
64 | + "openai_temperature": lines[29-1].strip(),
65 | + "openai_top_p": lines[31-1].strip(),
66 | + "openai_n": lines[33-1].strip(),
67 | + "openai_stream": lines[35-1].strip(),
68 | + "openai_stop": lines[37-1].strip(),
69 | + "openai_logit_bias": lines[39-1].strip(),
70 | + "openai_max_tokens": lines[41-1].strip(),
71 | + "openai_presence_penalty": lines[43-1].strip(),
72 | + "openai_frequency_penalty": lines[45-1].strip(),
73 | + "openai_disclaimer": lines[47-1].strip(),
74 | + "gemini_help_link": lines[50-1].strip(),
75 | + "gemini_model": lines[52-1].strip(),
76 | + "gemini_prompt": lines[54-1].strip(),
77 | + "gemini_temperature": lines[56-1].strip(),
78 | + "gemini_top_p": lines[58-1].strip(),
79 | + "gemini_top_k": lines[60-1].strip(),
80 | + "gemini_candidate_count": lines[62-1].strip(),
81 | + "gemini_stream": lines[64-1].strip(),
82 | + "gemini_stop_sequences": lines[66-1].strip(),
83 | + "gemini_max_output_tokens": lines[68-1].strip(),
84 | + "gemini_disclaimer": lines[70-1].strip(),
85 | + "deepl_help_link": lines[73-1].strip(),
86 | + "deepl_context": lines[75-1].strip(),
87 | + "deepl_split_sentences": lines[77-1].strip(),
88 | + "deepl_preserve_formatting": lines[79-1].strip(),
89 | + "deepl_formality": lines[81-1].strip(),
90 |   }
91 |
92 |   ##-------------------start-of-build_gui()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
|
100 |
"""
|
101 |
|
102 |
+
with gr.Blocks(title="Kudasai", delete_cache=(300, 300)) as self.gui:
|
103 |
|
104 |
##-------------------start-of-Utility-Functions---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
|
105 |
|
|
|
262 |   4: "number_of_malformed_batch_retries",
263 |   5: "batch_retry_timeout",
264 |   6: "number_of_concurrent_batches",
265 | + 7: "gender_context_insertion",
266 | + 8: "is_cote",
267 | + 9: "openai_model",
268 | + 10: "openai_system_message",
269 | + 11: "openai_temperature",
270 | + 12: "openai_top_p",
271 | + 13: "openai_n",
272 | + 14: "openai_stream",
273 | + 15: "openai_stop",
274 | + 16: "openai_logit_bias",
275 | + 17: "openai_max_tokens",
276 | + 18: "openai_presence_penalty",
277 | + 19: "openai_frequency_penalty",
278 | + 20: "gemini_model",
279 | + 21: "gemini_prompt",
280 | + 22: "gemini_temperature",
281 | + 23: "gemini_top_p",
282 | + 24: "gemini_top_k",
283 | + 25: "gemini_candidate_count",
284 | + 26: "gemini_stream",
285 | + 27: "gemini_stop_sequences",
286 | + 28: "gemini_max_output_tokens",
287 | + 29: "deepl_context",
288 | + 30: "deepl_split_sentences",
289 | + 31: "deepl_preserve_formatting",
290 | + 32: "deepl_formality",
291 |   }
292 |
293 |   for index, setting in enumerate(translation_settings):
386 |   with gr.Column():
387 |       self.input_txt_file_translator = gr.File(label='TXT file with Japanese Text', file_count='single', file_types=['.txt'], type='filepath', interactive=True)
388 |       self.input_text_translator = gr.Textbox(label='Japanese Text', placeholder='Use this or the text file input, if you provide both, Kudasai will use the file input.', lines=10, show_label=True, interactive=True, type='text')
389 | +     self.input_translation_rules_file = gr.File(value = FileEnsurer.config_translation_settings_path, label='Translation Settings File', file_count='single', file_types=['.json'], type='filepath', interactive=True)
390 | +     self.input_genders_file = gr.File(value=FileEnsurer.config_translation_genders_path, label='Genders.json File', file_count='single', file_types=['.json'], type='filepath', interactive=True)
391 |
392 |   with gr.Row():
393 |       self.llm_option_dropdown = gr.Dropdown(label='Translation Method', choices=["OpenAI", "Gemini", "DeepL", "Google Translate"], value="DeepL", show_label=True, interactive=True)
494 |   interactive=True,
495 |   elem_id="number_of_concurrent_batches",
496 |   show_copy_button=True)
497 | +
498 | + self.gender_context_insertion_input_field = gr.Checkbox(label="Gender Context Insertion",
499 | +                                                         value=bool(GuiJsonUtil.fetch_translation_settings_key_values("base translation settings","gender_context_insertion")),
500 | +                                                         info=KudasaiGUI.description_dict.get("gender_context_insertion"),
501 | +                                                         show_label=True,
502 | +                                                         interactive=True,
503 | +                                                         elem_id="number_of_concurrent_batches")
504 | +
505 | + self.is_cote_input_field = gr.Checkbox(label="Is Cote",
506 | +                                        value=bool(GuiJsonUtil.fetch_translation_settings_key_values("base translation settings","is_cote")),
507 | +                                        info=KudasaiGUI.description_dict.get("is_cote"),
508 | +                                        show_label=True,
509 | +                                        interactive=True,
510 | +                                        elem_id="is_cote")
511 |
512 |   with gr.Column():
513 |
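One caveat with the two checkboxes above: if `fetch_translation_settings_key_values` hands back the stored setting as a string, `bool(...)` is True for any non-empty value, including `"false"`. A stricter coercion would look roughly like this (the `to_bool` helper is illustrative, not from the repo):

```python
def to_bool(value) -> bool:
    ## treat the usual textual falsy spellings as False instead of
    ## relying on bool(), which is True for any non-empty string
    if isinstance(value, str):
        return value.strip().lower() in ("true", "1", "yes")
    return bool(value)

assert to_bool("false") is False
assert to_bool("true") is True
```

Note also that the gender checkbox reuses `elem_id="number_of_concurrent_batches"`, which looks like a copy-paste carry-over from the field above it.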
976 |   JsonHandler.current_translation_settings = GuiJsonUtil.current_translation_settings
977 |
978 |   ## next, set the llm type
979 | + translation_methods = {
980 | +     "OpenAI": "openai",
981 | +     "Gemini": "gemini",
982 | +     "DeepL": "deepl",
983 | +     "Google Translate": "google translate"
984 | + }
985 | +
986 | + Translator.TRANSLATION_METHOD = translation_methods.get(translation_method, "") # type: ignore
987 |
988 |   ## api key as well
989 |   await set_translator_api_key(api_key)
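The dictionary lookup above replaces the removed if/elif chain from the old block, and `dict.get` with a `""` default makes the fallback for an unrecognized dropdown value explicit. The same pattern in isolation (the names mirror the diff; the asserts are illustrative):

```python
translation_methods = {
    "OpenAI": "openai",
    "Gemini": "gemini",
    "DeepL": "deepl",
    "Google Translate": "google translate",
}

## unknown choices fall back to "" instead of raising KeyError,
## which is what an unguarded translation_methods[choice] would do
assert translation_methods.get("DeepL", "") == "deepl"
assert translation_methods.get("not a method", "") == ""
```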
1148 |
1149 |   ##-------------------start-of-clear_translator_tab()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1150 |
1151 | + def clear_translator_tab() -> typing.Tuple[None, str, gr.File, gr.File, str, str, str]:
1152 |
1153 |   """
1154 |
1157 |   Returns:
1158 |       input_txt_file_translator (gr.File) : An empty file.
1159 |       input_text_translator (str) : An empty string.
1160 | +     input_translation_rules_file (gr.File) : An empty file.
1161 | +     input_genders_file (gr.File) : An empty file.
1162 |       translator_translated_text_output_field (str) : An empty string.
1163 |       je_check_text_field_translator (str) : An empty string.
1164 |       translator_debug_log_output_field (str) : An empty string.
1176 |   input_text_translator = ""
1177 |
1178 |   ## Also gonna want to reset the json input field to the default json file
1179 | + input_translation_rules_file = gr.File(value = FileEnsurer.config_translation_settings_path, label='Translation Settings File', file_count='single', file_types=['.json'], type='filepath', interactive=True)
1180 | +
1181 | + ## same for genders shit
1182 | + input_genders_file = gr.File(value=(FileEnsurer.config_translation_genders_path), label='Genders.json File', file_count='single', file_types=['.json'], type='filepath', interactive=True)
1183 |
1184 |   translator_translated_text_output_field = ""
1185 |   je_check_text_field_translator = ""
1186 |   translator_debug_log_output_field = ""
1187 |
1188 | + return input_file_translator, input_text_translator, input_translation_rules_file, input_genders_file, translator_translated_text_output_field, je_check_text_field_translator, translator_debug_log_output_field
1189 |
1190 |   ##-------------------start-of-clear_log_button_click()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1191 |
1219 |   num_malformed_batch_retries:int,
1220 |   batch_retry_timeout:int,
1221 |   num_concurrent_batches:int,
1222 | + gender_context_insertion:bool,
1223 | + is_cote:bool,
1224 |   openai_model:str,
1225 |   openai_system_message:str,
1226 |   openai_temperature:float,
1265 |
num_malformed_batch_retries,
|
1266 |
batch_retry_timeout,
|
1267 |
num_concurrent_batches,
|
1268 |
+
gender_context_insertion,
|
1269 |
+
is_cote,
|
1270 |
openai_model,
|
1271 |
openai_system_message,
|
1272 |
openai_temperature,
|
|
|
1296 |
|
1297 |
## create the new key-value pair list
|
1298 |
new_key_value_tuple_pairs = create_new_key_value_tuple_pairs(settings_list)
|
1299 |
+
|
1300 |
try:
|
1301 |
+
## and then have the GuiJsonUtil apply the new translator settings
|
1302 |
GuiJsonUtil.update_translation_settings_with_new_values(input_translation_rules_file, new_key_value_tuple_pairs)
|
1303 |
|
1304 |
except:
|
|
|
1329 |
("base translation settings", "number_of_malformed_batch_retries", str),
|
1330 |
("base translation settings", "batch_retry_timeout", str),
|
1331 |
("base translation settings", "number_of_concurrent_batches", str),
|
1332 |
+
("base translation settings", "gender_context_insertion", bool),
|
1333 |
+
("base translation settings", "is_cote", bool),
|
1334 |
("openai settings", "openai_model", str),
|
1335 |
("openai settings", "openai_system_message", str),
|
1336 |
("openai settings", "openai_temperature", float),
|
|
|
1388 |
("base translation settings", "number_of_malformed_batch_retries", str),
|
1389 |
("base translation settings", "batch_retry_timeout", str),
|
1390 |
("base translation settings", "number_of_concurrent_batches", str),
|
1391 |
+
("base translation settings", "gender_context_insertion", bool),
|
1392 |
+
("base translation settings", "is_cote", bool),
|
1393 |
("openai settings", "openai_model", str),
|
1394 |
("openai settings", "openai_system_message", str),
|
1395 |
("openai settings", "openai_temperature", float),
|
|
|
1423 |
raise gr.Error("Invalid Custom Translation Settings File")
|
1424 |
|
1425 |
return return_batch
|
1426 |
+
|
1427 |
+
##-------------------start-of-set_genders_file()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
|
1428 |
+
|
1429 |
+
def set_genders_file(input_gender_file:gr.File):
|
1430 |
+
|
1431 |
+
"""
|
1432 |
+
|
1433 |
+
Sets the genders file.
|
1434 |
+
|
1435 |
+
"""
|
1436 |
+
|
1437 |
+
try:
|
1438 |
+
|
1439 |
+
contents = gui_get_json_from_file(input_gender_file)
|
1440 |
+
|
1441 |
+
with open(FileEnsurer.config_translation_genders_path, "w", encoding="utf-8") as f:
|
1442 |
+
json.dump(contents, f, indent=4)
|
1443 |
+
|
1444 |
+
except Exception as e:
|
1445 |
+
raise gr.Error(f"Error {e} occurred while setting genders file.")
|
1446 |
+
|
1447 |
+
##----------------start-of-clear_genders_file()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
|
1448 |
+
|
1449 |
+
|
1450 |
+
def clear_genders_file(temp_file:gr.File) -> None:
|
1451 |
+
|
1452 |
+
"""
|
1453 |
+
|
1454 |
+
Clears the genders file.
|
1455 |
+
|
1456 |
+
"""
|
1457 |
+
|
1458 |
+
try:
|
1459 |
+
|
1460 |
+
with open(FileEnsurer.config_translation_genders_path, "w", encoding="utf-8") as f:
|
1461 |
+
json.dump(FileEnsurer.DEFAULT_GENDER_SETTINGS, f, indent=4)
|
1462 |
+
|
1463 |
+
with open(temp_file.name, "w", encoding="utf-8") as f: # type: ignore
|
1464 |
+
json.dump(FileEnsurer.DEFAULT_GENDER_SETTINGS, f, indent=4)
|
1465 |
+
|
1466 |
+
except:
|
1467 |
+
|
1468 |
+
pass
|
1469 |
+
|
1470 |
+
return None
|
1471 |
|
1472 |
##-------------------start-of-clear_translation_settings_input_fields()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
|
1473 |
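For reference, the file these two handlers copy around is the `genders.json` that `gender_context_insertion` scans names from. Its exact schema is not shown in this diff (the repo ships a `demo/genders.json` with the authoritative format), so the sketch below is only a plausible shape and usage:

```python
## plausible genders.json shape: a character-name-to-gender mapping (an
## assumption; see demo/genders.json in the repo for the real format)
genders = {
    "Ayanokouji Kiyotaka": "Male",
    "Horikita Suzune": "Female",
}

def build_gender_context(batch: str) -> str:
    ## emit one line per known name found in the batch; something like this
    ## is what would get appended to the system prompt (illustrative)
    return "\n".join(f"{name} is {gender}." for name, gender in genders.items() if name in batch)
```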
1489 |   "num_malformed_batch_retries_value": None,
1490 |   "batch_retry_timeout_value": None,
1491 |   "num_concurrent_batches_value": None,
1492 | + "gender_context_insertion_value": None,
1493 | + "is_cote_value": None,
1494 |   "openai_model_value": None,
1495 |   "openai_system_message_value": None,
1496 |   "openai_temperature_value": None,
1643 |   self.logging_tab_debug_log_output_field, ## debug log on log tab
1644 |   self.logging_tab_error_log_output_field]) ## error log on log tab
1645 |
1646 |   ##-------------------start-of-translate_with_translator()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1647 |
1648 |   ## for the actual translation, and the je check text
1667 |
1668 |   every=.1) ## update every 100ms
1669 |
1670 |   ##-------------------start-of translator_calculate_costs_button_click()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1671 |
1672 |   self.translator_calculate_cost_button.click(translator_calculate_costs_button_click,
1715 |   self.input_txt_file_translator, ## input txt file
1716 |   self.input_text_translator, ## input text
1717 |   self.input_translation_rules_file, ## Translation Settings File
1718 | + self.input_genders_file, ## Gender File
1719 |   self.translator_translated_text_output_field, ## translation output field
1720 |   self.translator_je_check_text_output_field, ## je check text field on translator tab
1721 |   self.translator_debug_log_output_field], ## debug log on translator tab
1743 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1744 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1745 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1746 | + self.gender_context_insertion_input_field, ## gender context insertion input field
1747 | + self.is_cote_input_field, ## is cote input field
1748 |   self.openai_model_input_field, ## openai model input field
1749 |   self.openai_system_message_input_field, ## openai system message input field
1750 |   self.openai_temperature_input_field, ## openai temperature input field
1785 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1786 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1787 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1788 | + self.gender_context_insertion_input_field, ## gender context insertion input field
1789 | + self.is_cote_input_field, ## is cote input field
1790 |   self.openai_model_input_field, ## openai model input field
1791 |   self.openai_system_message_input_field, ## openai system message input field
1792 |   self.openai_temperature_input_field, ## openai temperature input field
1825 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1826 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1827 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1828 | + self.gender_context_insertion_input_field, ## gender context insertion input field
1829 | + self.is_cote_input_field, ## is cote input field
1830 |   self.openai_model_input_field, ## openai model input field
1831 |   self.openai_system_message_input_field, ## openai system message input field
1832 |   self.openai_temperature_input_field, ## openai temperature input field
1865 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1866 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1867 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1868 | + self.gender_context_insertion_input_field, ## gender context insertion input field
1869 | + self.is_cote_input_field, ## is cote input field
1870 |   self.openai_model_input_field, ## openai model input field
1871 |   self.openai_system_message_input_field, ## openai system message input field
1872 |   self.openai_temperature_input_field, ## openai temperature input field
1904 |   self.number_of_malformed_batch_retries_input_field, ## num malformed batch retries input field
1905 |   self.batch_retry_timeout_input_field, ## batch retry timeout input field
1906 |   self.number_of_concurrent_batches_input_field, ## num concurrent batches input field
1907 | + self.gender_context_insertion_input_field, ## gender context insertion input field
1908 | + self.is_cote_input_field, ## is cote input field
1909 |   self.openai_model_input_field, ## openai model input field
1910 |   self.openai_system_message_input_field, ## openai system message input field
1911 |   self.openai_temperature_input_field, ## openai temperature input field
1930 |   self.deepl_split_sentences_input_field, ## deepl split sentences input field
1931 |   self.deepl_preserve_formatting_input_field, ## deepl preserve formatting input field
1932 |   self.deepl_formality_input_field]) ## deepl formality input field
1933 | +
1934 | +
1935 | + ##----------------start-of-input_genders_file_upload()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1936 | +
1937 | + self.input_genders_file.upload(set_genders_file,
1938 | +                                inputs=[self.input_genders_file],
1939 | +                                outputs=[]
1940 | +                                )
1941 | +
1942 | + self.input_genders_file.clear(clear_genders_file,
1943 | +                               inputs=[self.input_genders_file],
1944 | +                               outputs=[self.input_genders_file]
1945 | +                               )
1946 |
1947 |   ##-------------------start-of-logging_tab.select()---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
1948 |
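The two listeners above follow standard Gradio event wiring: `File.upload` fires with the uploaded file so it can be persisted, and `File.clear` restores the default and hands the component back through `outputs`. A stripped-down sketch of the same wiring (the handler bodies are illustrative):

```python
import gradio as gr

def on_upload(path):
    ## with type='filepath' the handler receives the temp file's path as a str
    print(f"received {path}")

def on_clear(path):
    return None  ## returning None empties the component again

with gr.Blocks() as demo:
    genders_file = gr.File(label="Genders.json File", file_types=[".json"], type="filepath")
    genders_file.upload(on_upload, inputs=[genders_file], outputs=[])
    genders_file.clear(on_clear, inputs=[genders_file], outputs=[genders_file])

## demo.launch()
```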