Spaces:
Runtime error
Runtime error
| import gradio as gr | |
| from llama_cpp import Llama | |
# Load the GGUF-format Mistral-7B-Instruct weights once, at import time,
# with a 2048-token context window. Every request reuses this instance.
llm = Llama(
    n_ctx=2048,
    model_path="./models/mistral-7b-instruct-v0.2.Q4_K_M.gguf",
)
# Function to generate response
def generate_response(prompt: str) -> str:
    """Return the model's completion text for ``prompt``.

    A missing or whitespace-only prompt short-circuits to an empty string
    so that no inference is run for an empty text box. Otherwise the
    prompt is passed unchanged to the module-level ``llm`` with a cap of
    200 generated tokens and ``"</s>"`` as the stop sequence.

    Args:
        prompt: Raw text entered by the user.

    Returns:
        The ``text`` field of the first completion choice, or ``""`` when
        the prompt is blank.
    """
    # Guard first: nothing useful can be generated from blank input, and
    # skipping the call avoids a full forward pass for it.
    if not prompt or not prompt.strip():
        return ""
    output = llm(prompt, max_tokens=200, stop=["</s>"])
    return output["choices"][0]["text"]
# Gradio callback: hands the submitted text to the model helper
def chat(prompt):
    """Handle one Gradio submission by delegating to ``generate_response``."""
    reply = generate_response(prompt)
    return reply
# Build the Gradio UI: a single text input wired to `chat`, with a single
# text output.
# `live` is intentionally left at its default (off). In live mode Gradio
# re-runs `fn` whenever the input changes, which would start a new model
# completion on every keystroke; the user submits explicitly instead.
iface = gr.Interface(fn=chat, inputs="text", outputs="text")
iface.launch()