# testNLLB / app.py — Hugging Face Space (commit 918fd7f)
import os
import torch
import gradio as gr
import time
import threading
from flask import Flask, request
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
from flores200_codes import flores_codes
def load_models():
    """Download and instantiate every enabled NLLB checkpoint.

    Returns a dict keyed by ``'<name>_model'`` and ``'<name>_tokenizer'``
    for each entry in the model table below.
    """
    # Only the distilled 1.3B checkpoint is enabled; the other variants
    # are kept commented out so they can be switched on easily.
    available_models = {
        # 'nllb-distilled-600M': 'facebook/nllb-200-distilled-600M',
        # 'nllb-1.3B': 'facebook/nllb-200-1.3B',
        'nllb-distilled-1.3B': 'facebook/nllb-200-distilled-1.3B',
        # 'nllb-3.3B': 'facebook/nllb-200-3.3B',
    }

    loaded = {}
    for short_name, hub_id in available_models.items():
        print('\tLoading model: %s' % short_name)
        loaded[short_name + '_model'] = AutoModelForSeq2SeqLM.from_pretrained(hub_id)
        loaded[short_name + '_tokenizer'] = AutoTokenizer.from_pretrained(hub_id)
    return loaded
def translation(source, target, text):
    """Translate ``text`` from ``source`` to ``target`` language.

    Parameters
    ----------
    source, target : str
        Human-readable language names; must be keys of ``flores_codes``,
        which maps them to FLORES-200 language codes.
    text : str
        Text to translate.

    Returns
    -------
    dict
        Keys: ``inference_time`` (seconds), ``source``/``target``
        (FLORES codes), ``result`` (translated string), ``full_output``
        (raw pipeline output list).

    Raises
    ------
    KeyError
        If a language name is not in ``flores_codes`` or the expected
        model is missing from the module-global ``model_dict``.
    """
    # BUG FIX: the original only assigned model_name inside
    # `if len(model_dict) == 2:`, so any other dict size produced an
    # opaque NameError later on. The name is a constant — set it always;
    # a missing model now fails with a clear KeyError at the dict lookup.
    model_name = 'nllb-distilled-1.3B'

    start_time = time.time()

    # Map human-readable names to FLORES-200 codes.
    source = flores_codes[source]
    target = flores_codes[target]

    model = model_dict[model_name + '_model']
    tokenizer = model_dict[model_name + '_tokenizer']

    # NOTE(review): a pipeline object is rebuilt on every call; this is
    # cheap relative to inference but could be cached per (src, tgt).
    translator = pipeline('translation', model=model, tokenizer=tokenizer,
                          src_lang=source, tgt_lang=target)

    output = translator(text, max_length=400)
    end_time = time.time()

    full_output = output
    output = output[0]['translation_text']
    result = {'inference_time': end_time - start_time,
              'source': source,
              'target': target,
              'result': output,
              'full_output': full_output}
    return result
def start_flask():
    """Run a small Flask server exposing the translator over HTTP.

    POST /translate with form fields 'source', 'target' and 'text'
    returns the ``translation()`` result dict (serialized by Flask).
    Blocks until the server is stopped.
    """
    app = Flask(__name__)

    @app.route('/translate', methods=['POST'])
    def translate():
        form = request.form
        return translation(form['source'], form['target'], form['text'])

    app.run()
if __name__ == '__main__':
    print('\tinit models')
    # FIX: removed the original `global model_dict` — `global` is a
    # no-op at module level; plain assignment here already creates the
    # module-global that translation() reads.
    model_dict = load_models()

    # ---- gradio demo ----
    lang_codes = list(flores_codes.keys())
    # A model-selector Radio input was removed since only one model is
    # loaded; inputs are source language, target language, and text.
    inputs = [gr.inputs.Dropdown(lang_codes, default='Yue Chinese', label='Source'),
              gr.inputs.Dropdown(lang_codes, default='English', label='Target'),
              gr.inputs.Textbox(lines=5, label="Input text"),
              ]
    outputs = gr.outputs.JSON()

    title = "NLLB distilled 1.3B distilled demo"
    demo_status = "Demo is running on CPU"
    description = f"Details: https://github.com/facebookresearch/fairseq/tree/nllb. {demo_status}"
    examples = [
        ['Yue Chinese', 'English', '你食咗飯未?']
    ]

    gr.Interface(translation,
                 inputs,
                 outputs,
                 title=title,
                 description=description,
                 examples=examples,
                 examples_per_page=50,
                 ).launch(share=True)