"""Launch a Gradio interface for a model identified by ``MODEL_NAME``."""

import gradio as gr

# Identifier handed to Gradio's loader. The "models/" prefix presumably
# selects the Hugging Face model hub as the source -- confirm against the
# installed Gradio version's loader documentation.
MODEL_NAME = "models/dontito/llama-7b-hf-v0"

# Build the interface from the model identifier. No tokenizer or model
# configuration is loaded explicitly here; whatever loading happens is done
# inside Gradio's loader.
# NOTE(review): newer Gradio releases appear to expose this loader as
# `gr.load`; verify `gr.Interface.load` is still available in the pinned
# version before upgrading.
demo = gr.Interface.load(MODEL_NAME)

# Start the app with Gradio's debug mode enabled.
demo.launch(debug=True)