Spaces:
Build error
Build error
| import gradio as gr | |
| import yaml | |
| from joeynmt.prediction import load_params_for_prediction,translate_for_hf_space | |
| from huggingface_hub import hf_hub_download | |
| language_map = {'English':'en','Swahili':'sw','Fon':'fon','Igbo':'ig', | |
| 'Arabic':'ar','Shona':'sn','Ẹ̀dó':'bin','Hausa':'ha', | |
| 'Efik':'efi','Twi':'twi','Afrikaans':'af','Yoruba':'yo','Urhobo':'urh','Dendi':'ddn','̀Ẹ̀sán':'ish','Isoko':'iso', | |
| 'Kamba':'kam','Luo':'luo','Southern Ndebele':'nr','Tshivenda':'ve'} | |
| #List of available languages I worked on. | |
| #... | |
| available_language_pairs =['en-sw','en-af','en-ar','en-ddn','en-ish','en-iso','en-kam','en-luo','en-nr','en-ve','efi-en','en-bin','en-ha','en-ig','en-fon','en-twi','sn-en','sw-en','yo-en','en-urh'] | |
| available_languages = list(language_map.keys()) | |
| def load_config(path="configs/default.yaml") -> dict: | |
| """ | |
| CODE ADAPTED FROM: https://github.com/joeynmt/joeynmt | |
| Loads and parses a YAML configuration file. | |
| :param path: path to YAML configuration file | |
| :return: configuration dictionary | |
| """ | |
| with open(path, 'r', encoding="utf-8") as ymlfile: | |
| cfg = yaml.safe_load(ymlfile) | |
| return cfg | |
| def load_model(source_language,target_language): | |
| #source_language = language_map[source_language_] | |
| #target_language = language_map[target_language_] | |
| translation_dir = 'main' | |
| try: | |
| file_yaml = hf_hub_download("chrisjay/masakhane_benchmarks", filename=f"{source_language}-{target_language}/{translation_dir}/config.yaml",force_filename='config.yaml') | |
| src_vocab = hf_hub_download("chrisjay/masakhane_benchmarks", filename=f"{source_language}-{target_language}/{translation_dir}/src_vocab.txt") | |
| trg_vocab = hf_hub_download("chrisjay/masakhane_benchmarks", filename=f"{source_language}-{target_language}/{translation_dir}/trg_vocab.txt") | |
| best_ckpt = hf_hub_download("chrisjay/masakhane_benchmarks", filename=f"{source_language}-{target_language}/{translation_dir}/best.ckpt") | |
| except Exception: | |
| raise Exception(f'It seems we do not have a working configuration repo yet for {source_language} -> {target_language}. \n You could help us by creating it here: https://huggingface.co/chrisjay/masakhane_benchmarks/tree/main') | |
| parsed_yaml_file = load_config(file_yaml) | |
| parsed_yaml_file['data']['src_vocab']=src_vocab | |
| parsed_yaml_file['data']['trg_vocab']=trg_vocab | |
| params = load_params_for_prediction(parsed_yaml_file,best_ckpt) | |
| return params | |
| #Load models of all available language pairs | |
| model_mapping = {} | |
| examples_available_models=[] # Keep track of models that loaded successfully and display only them in the Examples. | |
| for availabe_lang in available_language_pairs: | |
| try: | |
| model_mapping.update({availabe_lang:load_model(availabe_lang.split('-')[0],availabe_lang.split('-')[1])}) | |
| examples_available_models.append([f"{list(language_map.keys())[list(language_map.values()).index(availabe_lang.split('-')[0])]}",f"{list(language_map.keys())[list(language_map.values()).index(availabe_lang.split('-')[1])]}"]) #idea to extract key from value got from https://stackoverflow.com/questions/8023306/get-key-by-value-in-dictionary | |
| except Exception: | |
| continue | |
| if examples_available_models==[]: | |
| raise Exception(f'Available models for Space cannot be empty!') | |
| def get_translation(source_language,target_language,source_sentence=None,source_file=None): | |
| ''' | |
| This takes a sentence and gets the translation. | |
| ''' | |
| source_language_ = language_map[source_language] | |
| target_language_ = language_map[target_language] | |
| source = source_sentence | |
| translation_type='sentence' | |
| if source_file!=None: | |
| translation_type='file' | |
| source = source_file.name | |
| try: | |
| params = model_mapping[f'{source_language_}-{target_language_}'] | |
| pred = translate_for_hf_space(params,source,translation_type) | |
| except Exception: | |
| return f'There was an issue loading the translation model for {source_language} -> {target_language}. Try another pair please' | |
| return pred[0] if source_file==None else pred | |
| title = "Interact with Masakhane Benchmark Models" | |
| description = "This enables you to interact with some of the Masakhane Benchmark Models and keep up with their improvement. Some of these models undergo finetuning on a regular basis. This way, you can easily use the best model with no hassles." | |
| iface = gr.Interface(fn=get_translation, | |
| inputs=[gr.inputs.Dropdown(choices = available_languages,default='English'), | |
| gr.inputs.Dropdown(choices = available_languages,default='Swahili'), | |
| gr.inputs.Textbox(label="Input"), | |
| gr.inputs.File(file_count="single", type="file", label='Or upload txt file containing sentences', optional=True)], | |
| outputs=gr.outputs.Textbox(type="auto", label='Translation'), | |
| title=title, | |
| description=description, | |
| examples=examples_available_models, | |
| enable_queue=True, | |
| theme='huggingface') | |
| iface.launch() | |