Spaces:
Runtime error
Runtime error
"""#Imports""" | |
#!pip install transformers gradio accelerate bitsandbytes sentencepiece | |
import multiprocessing | |
import torch | |
from transformers import T5Tokenizer, T5ForConditionalGeneration | |
import gradio as gr | |
"""#Code""" | |
device = "cuda:0" if torch.cuda.is_available() else "cpu" | |
"""##FP 32""" | |
tokenizer = T5Tokenizer.from_pretrained("google/flan-t5-xl") | |
model = T5ForConditionalGeneration.from_pretrained("google/flan-t5-xl", device_map="auto") | |
"""###Interface""" | |
def generate(input_text, minimum_length, maximum_length, beam_amount, temperature, length_penalty, repetition_penalty): | |
input_ids = tokenizer(input_text, return_tensors="pt").input_ids.to(device) | |
outputs = model.generate(input_ids, | |
min_length=minimum_length, | |
max_new_tokens=maximum_length, | |
length_penalty=length_penalty, | |
num_beams=beam_amount, | |
no_repeat_ngram_size=3, | |
temperature=temperature, | |
top_k=100, | |
top_p=0.9, | |
repetition_penalty=repetition_penalty, | |
) | |
return tokenizer.decode(outputs[0], skip_special_tokens=True).capitalize() | |
title = "Flan-T5-XL Inference on GRADIO GUI" | |
def inference(input_text, minimum_length, maximum_length, beam_amount, temperature, length_penalty, repetition_penalty): | |
return generate(input_text, minimum_length, maximum_length, beam_amount, temperature, length_penalty, repetition_penalty) | |
io = gr.Interface( | |
fn=inference, | |
inputs=[gr.Textbox(lines=4), gr.Slider(0, 300), gr.Slider(100, 2000), gr.Slider(1, 12, step=1), gr.Slider(0, 2, step=0.1), gr.Slider(1, 3, step=0.1)], | |
outputs=[ | |
gr.Textbox(lines=2, label="Flan-T5-XL Inference") | |
], | |
title=title, | |
css=""" | |
body {background-color: lightgreen} | |
.input_text input { | |
background-color: lightblue !important; | |
} | |
""" | |
) | |
io.launch(share=False, debug=False) |