from transformers import AutoTokenizer, AutoModelForCausalLM
import gradio as gr
# Hugging Face Hub checkpoint shared by the tokenizer and the model.
MODEL_ID = "huggyllama/llama-7b"

# Both objects are created once at import time and reused for every request.
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
model = AutoModelForCausalLM.from_pretrained(MODEL_ID)
def chatbot_response(input_text):
    """Generate a text continuation of ``input_text`` with the loaded model.

    Args:
        input_text: Prompt typed by the user.

    Returns:
        The decoded first generated sequence with special tokens removed,
        or an empty string when the prompt is empty or only whitespace.
        NOTE(review): causal LMs normally return the prompt followed by the
        continuation, so the reply presumably begins with the prompt;
        confirm whether the UI should strip it.
    """
    # Nothing to continue from; skip an expensive generation pass.
    if not input_text or not input_text.strip():
        return ""

    # Keep the encoded batch on the same device as the model weights.
    encoded = tokenizer(input_text, return_tensors="pt").to(model.device)
    # Forward the attention mask together with the token ids, and bound only
    # the newly generated part: max_length also counts the prompt, so a
    # prompt of 200+ tokens would leave no room for output.
    generated = model.generate(
        encoded["input_ids"],
        attention_mask=encoded.get("attention_mask"),
        max_new_tokens=200,
        num_return_sequences=1,
    )
    return tokenizer.decode(generated[0], skip_special_tokens=True)
# Plain text-in / text-out UI around chatbot_response. Live mode is left off:
# it re-runs the function on every input change, which would start a full
# model generation per keystroke; the Submit button triggers a single run.
interface = gr.Interface(fn=chatbot_response, inputs="text", outputs="text")
interface.launch()