cstr committed on
Commit
9aac513
•
1 Parent(s): 4ed2821

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -618,11 +618,12 @@ def main(dataset_url, model_type, output_dataset_name, range_specification, targ
618
  gradio_title = "🧐 WMT21 Dataset Translation"
619
  gradio_desc = """This tool translates english datasets using the WMT21 translation model.
620
  ## 💭 What Does This Tool Do:
621
- - Translates datasets with structures based on the selected model type.
622
  - The translation model (facebook/wmt21-dense-24-wide-en-x) supports as target languages: Hausa (ha), Icelandic (is), Japanese (ja), Czech (cs), Russian (ru), Chinese (zh), German (de)
623
- - Uploads the translated dataset to Hugging Face.
624
- - At the moment, this works only on CPU, and therefore is very very slow (>1 minute per item depending on string lengths)."""
625
  datasets_desc = """## 📊 Dataset Types:
 
626
  - **mix**:
627
  - `prompt`: List of dictionaries with 'content' and 'role' fields (multi-turn conversation).
628
  - `chosen`: Single dictionary with 'content' and 'role' fields.
 
618
  gradio_title = "🧐 WMT21 Dataset Translation"
619
  gradio_desc = """This tool translates english datasets using the WMT21 translation model.
620
  ## 💭 What Does This Tool Do:
621
+ - Translates datasets (as parquet files) with structures based on the selected model type (see below).
622
  - The translation model (facebook/wmt21-dense-24-wide-en-x) supports as target languages: Hausa (ha), Icelandic (is), Japanese (ja), Czech (cs), Russian (ru), Chinese (zh), German (de)
623
+ - Uploads the translated dataset as jsonl to Hugging Face.
624
+ - At the moment, this works only on CPU, and therefore is very very slow."""
625
  datasets_desc = """## 📊 Dataset Types:
626
+ Note: additional fields will be kept (untranslated), an additional index field is added, which makes it easier to verify results, i.a.
627
  - **mix**:
628
  - `prompt`: List of dictionaries with 'content' and 'role' fields (multi-turn conversation).
629
  - `chosen`: Single dictionary with 'content' and 'role' fields.