Wootang01 committed on
Commit
d07f696
·
1 Parent(s): c1933f2

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +33 -0
app.py ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import streamlit as st
2
+ import torch
3
+ from transformers import pipeline
4
+ from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
5
+ from transformers import FSMTForConditionalGeneration, FSMTTokenizer
6
+
7
# Page heading for the app.
st.title("Paraphraser Three -- Back Translation")

# Free-text box holding the sentence to be paraphrased; the value is read
# by the translation steps further down the script.
user_input = st.text_area("Input sentence.")
10
+
11
def load_en2de():
    """Build the English-to-German translation pipeline.

    Returns:
        A ``transformers`` pipeline for the ``translation_en_to_de`` task
        backed by the ``t5-base`` checkpoint.
    """
    # NOTE(review): this is called at module level, so the pipeline is
    # constructed each time the script executes -- consider Streamlit's
    # resource caching if start-up latency matters (confirm installed version).
    return pipeline("translation_en_to_de", model="t5-base")
14
+
15
def load_de2en():
    """Load the German-to-English FSMT tokenizer and model.

    Returns:
        A ``(tokenizer, model)`` tuple, both loaded from the
        ``facebook/wmt19-de-en`` checkpoint.
    """
    # NOTE(review): called at module level, so both objects are loaded each
    # time the script executes -- consider Streamlit's resource caching
    # (confirm installed version).
    checkpoint = "facebook/wmt19-de-en"
    de_en_tokenizer = FSMTTokenizer.from_pretrained(checkpoint)
    de_en_model = FSMTForConditionalGeneration.from_pretrained(checkpoint)
    return de_en_tokenizer, de_en_model
20
+
21
# Load both translation directions up front so they are ready as soon as the
# user submits text.
en2de = load_en2de()
tokenizer_de2en, de2en = load_de2en()

# Only translate when there is real input. The text area is empty on first
# load, and pushing an empty/whitespace-only string through both models
# would display a meaningless "paraphrase".
if user_input.strip():
    # Step 1: English -> German. The pipeline returns a list with one dict
    # per input; the translated string is under 'translation_text'.
    en_to_de_output = en2de(user_input)
    translated_text = en_to_de_output[0]['translation_text']

    # Step 2: German -> English. Encode the German text, generate, and
    # decode the first (only) returned sequence without special tokens.
    input_ids = tokenizer_de2en.encode(translated_text, return_tensors="pt")
    output_ids = de2en.generate(input_ids)[0]
    augmented_text = tokenizer_de2en.decode(output_ids, skip_special_tokens=True)

    st.write("Paraphrased text using back translation: ", augmented_text)
32
+
33
+