maxbittker committed on
Commit
799254d
1 Parent(s): d510d4c

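Update app.py: hard-code the "en" → "tl" (toki pona) language pair and a single beam / return sequence; comment out the language and candidate-count inputs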

Browse files
Files changed (1) hide show
  1. app.py +11 -11
app.py CHANGED
@@ -10,16 +10,16 @@ LANG_CODES = {
10
  "toki pona":"tl"
11
  }
12
 
13
- def translate(text, src_lang, tgt_lang, candidates:int):
14
  """
15
  Translate the text from source lang to target lang
16
  """
17
 
18
- src = LANG_CODES.get(src_lang)
19
- tgt = LANG_CODES.get(tgt_lang)
20
 
21
- tokenizer.src_lang = src
22
- tokenizer.tgt_lang = tgt
23
 
24
  ins = tokenizer(text, return_tensors='pt').to(device)
25
 
@@ -28,8 +28,8 @@ def translate(text, src_lang, tgt_lang, candidates:int):
28
  'output_scores': True,
29
  'output_hidden_states': True,
30
  'length_penalty': 0.0, # don't encourage longer or shorter output,
31
- 'num_return_sequences': candidates,
32
- 'num_beams':candidates,
33
  'forced_bos_token_id': tokenizer.lang_code_to_id[tgt]
34
  }
35
 
@@ -78,11 +78,11 @@ with gr.Blocks() as app:
78
  gr.Markdown(markdown)
79
  with gr.Column():
80
  input_text = gr.components.Textbox(label="Input Text", value="Raccoons are fascinating creatures, but I prefer opossums.")
81
- source_lang = gr.components.Dropdown(label="Source Language", value="English", choices=list(LANG_CODES.keys()))
82
- target_lang = gr.components.Dropdown(label="Target Language", value="toki pona", choices=list(LANG_CODES.keys()))
83
- return_seqs = gr.Slider(label="Number of return sequences", value=3, minimum=1, maximum=12, step=1)
84
 
85
- inputs=[input_text, source_lang, target_lang, return_seqs]
86
  outputs = gr.Textbox()
87
 
88
  translate_btn = gr.Button("Translate! | o ante toki!")
 
10
  "toki pona":"tl"
11
  }
12
 
13
+ def translate(text):
14
  """
15
  Translate the text from source lang to target lang
16
  """
17
 
18
+ # src = LANG_CODES.get(src_lang)
19
+ # tgt = LANG_CODES.get(tgt_lang)
20
 
21
+ tokenizer.src_lang = "en"
22
+ tokenizer.tgt_lang = "tl"
23
 
24
  ins = tokenizer(text, return_tensors='pt').to(device)
25
 
 
28
  'output_scores': True,
29
  'output_hidden_states': True,
30
  'length_penalty': 0.0, # don't encourage longer or shorter output,
31
+ 'num_return_sequences': 1,
32
+ 'num_beams':1,
33
  'forced_bos_token_id': tokenizer.lang_code_to_id[tgt]
34
  }
35
 
 
78
  gr.Markdown(markdown)
79
  with gr.Column():
80
  input_text = gr.components.Textbox(label="Input Text", value="Raccoons are fascinating creatures, but I prefer opossums.")
81
+ # source_lang = gr.components.Dropdown(label="Source Language", value="English", choices=list(LANG_CODES.keys()))
82
+ # target_lang = gr.components.Dropdown(label="Target Language", value="toki pona", choices=list(LANG_CODES.keys()))
83
+ # return_seqs = gr.Slider(label="Number of return sequences", value=3, minimum=1, maximum=12, step=1)
84
 
85
+ inputs=[input_text]
86
  outputs = gr.Textbox()
87
 
88
  translate_btn = gr.Button("Translate! | o ante toki!")