barbaroo committed on
Commit
79787d6
1 Parent(s): 873d959

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +37 -7
app.py CHANGED
@@ -11,6 +11,8 @@ nltk.download('punkt')
11
  # Load the models and tokenizers
12
  model_checkpoint_fo_en = "barbaroo/nllb_200_600M_fo_en"
13
  model_checkpoint_en_fo = "barbaroo/nllb_200_600M_en_fo"
 
 
14
 
15
  tokenizer_fo_en = AutoTokenizer.from_pretrained(model_checkpoint_fo_en)
16
  model_fo_en = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint_fo_en)
@@ -18,14 +20,22 @@ model_fo_en = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint_fo_en)
18
  tokenizer_en_fo = AutoTokenizer.from_pretrained(model_checkpoint_en_fo)
19
  model_en_fo = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint_en_fo)
20
 
 
 
 
 
 
 
21
  # Check if a GPU is available and move models to GPU if possible
22
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
23
  print(f"Using device: {device}")
24
 
25
  if torch.cuda.is_available():
26
  print("GPU is available. Initializing models on GPU.")
27
- #model_fo_en.to(device)
28
- #model_en_fo.to(device)
 
 
29
  else:
30
  print("GPU is not available. Using CPU.")
31
 
@@ -34,7 +44,7 @@ def split_into_sentences(text):
34
 
35
  @spaces.GPU
36
  def translate(text, model, tokenizer, max_length=80):
37
- # Make sure model and tokenizer are on the correct device
38
  model.to(device)
39
 
40
  sentences = split_into_sentences(text)
@@ -63,9 +73,29 @@ def handle_input(text, file, direction):
63
  if direction == "fo_en":
64
  model = model_fo_en
65
  tokenizer = tokenizer_fo_en
66
- else:
67
  model = model_en_fo
68
  tokenizer = tokenizer_en_fo
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
69
 
70
  # Translate the text if it's not empty
71
  if text:
@@ -79,11 +109,11 @@ iface = gr.Interface(
79
  inputs=[
80
  gr.Textbox(lines=2, placeholder="Type here or upload a text file..."),
81
  gr.File(label="or Upload Text File", type="binary"),
82
- gr.Dropdown(label="Translation Direction", choices=["fo_en", "en_fo"], value="fo_en")
83
  ],
84
  outputs="text",
85
- title="Bidirectional Translator",
86
- description="Enter text directly or upload a text file (.txt) to translate between Faroese and English."
87
  )
88
 
89
  # Launch the interface
 
11
  # Load the models and tokenizers
12
  model_checkpoint_fo_en = "barbaroo/nllb_200_600M_fo_en"
13
  model_checkpoint_en_fo = "barbaroo/nllb_200_600M_en_fo"
14
+ model_checkpoint_uk_en = "Helsinki-NLP/opus-mt-uk-en"
15
+ model_checkpoint_en_uk = "Helsinki-NLP/opus-mt-en-uk"
16
 
17
  tokenizer_fo_en = AutoTokenizer.from_pretrained(model_checkpoint_fo_en)
18
  model_fo_en = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint_fo_en)
 
20
  tokenizer_en_fo = AutoTokenizer.from_pretrained(model_checkpoint_en_fo)
21
  model_en_fo = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint_en_fo)
22
 
23
+ tokenizer_uk_en = AutoTokenizer.from_pretrained(model_checkpoint_uk_en)
24
+ model_uk_en = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint_uk_en)
25
+
26
+ tokenizer_en_uk = AutoTokenizer.from_pretrained(model_checkpoint_en_uk)
27
+ model_en_uk = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint_en_uk)
28
+
29
  # Check if a GPU is available and move models to GPU if possible
30
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
31
  print(f"Using device: {device}")
32
 
33
  if torch.cuda.is_available():
34
  print("GPU is available. Initializing models on GPU.")
35
+ model_fo_en.to(device)
36
+ model_en_fo.to(device)
37
+ model_uk_en.to(device)
38
+ model_en_uk.to(device)
39
  else:
40
  print("GPU is not available. Using CPU.")
41
 
 
44
 
45
  @spaces.GPU
46
  def translate(text, model, tokenizer, max_length=80):
47
+ # Ensure model is on the correct device
48
  model.to(device)
49
 
50
  sentences = split_into_sentences(text)
 
73
  if direction == "fo_en":
74
  model = model_fo_en
75
  tokenizer = tokenizer_fo_en
76
+ elif direction == "en_fo":
77
  model = model_en_fo
78
  tokenizer = tokenizer_en_fo
79
+ elif direction == "uk_en":
80
+ model = model_uk_en
81
+ tokenizer = tokenizer_uk_en
82
+ elif direction == "en_uk":
83
+ model = model_en_uk
84
+ tokenizer = tokenizer_en_uk
85
+ elif direction == "uk_fo":
86
+ # Ukrainian to Faroese via English pivot
87
+ model = model_uk_en
88
+ tokenizer = tokenizer_uk_en
89
+ text = translate(text, model, tokenizer)
90
+ model = model_en_fo
91
+ tokenizer = tokenizer_en_fo
92
+ elif direction == "fo_uk":
93
+ # Faroese to Ukrainian via English pivot
94
+ model = model_fo_en
95
+ tokenizer = tokenizer_fo_en
96
+ text = translate(text, model, tokenizer)
97
+ model = model_en_uk
98
+ tokenizer = tokenizer_en_uk
99
 
100
  # Translate the text if it's not empty
101
  if text:
 
109
  inputs=[
110
  gr.Textbox(lines=2, placeholder="Type here or upload a text file..."),
111
  gr.File(label="or Upload Text File", type="binary"),
112
+ gr.Dropdown(label="Translation Direction", choices=["fo_en", "en_fo", "uk_en", "en_uk", "uk_fo", "fo_uk"], value="fo_en")
113
  ],
114
  outputs="text",
115
+ title="Multilingual Translator",
116
+ description="Enter text directly or upload a text file (.txt) to translate between Faroese, Ukrainian, and English."
117
  )
118
 
119
  # Launch the interface