# Script entry point: build a Gradio app from a hosted model reference and
# start serving it. The import and the call must be separate statements;
# having both on one physical line is a Python syntax error.
import gradio as gr

# Prefer the top-level `gr.load` when this Gradio version provides it and
# fall back to the `gr.Interface.load` spelling the script originally used.
# NOTE(review): newer Gradio releases appear to have dropped
# `Interface.load` in favour of `gr.load` — confirm against the pinned
# Gradio version.
load_model = getattr(gr, "load", None) or gr.Interface.load

# The model reference string is passed through unchanged; `.launch()` is
# called on whatever the loader returns.
load_model("models/TheBloke/Llama-2-13B-Chat-fp16").launch()