"""Launch a Gradio web UI for a model referenced by a Hub-style identifier.

Running this script loads the interface described by ``MODEL_ID`` and
starts the Gradio server with its default launch settings.
"""
import gradio as gr

# Identifier passed verbatim to the Gradio loader.
# NOTE(review): the "models/" prefix presumably selects a Hugging Face Hub
# model repository -- confirm against the Gradio loader documentation.
MODEL_ID = "models/soulteary/Chinese-Llama-2-7b-4bit"

# Prefer the top-level `gr.load` when this Gradio build provides it and fall
# back to the legacy `gr.Interface.load` otherwise, so the script runs on
# either API generation.
_load_interface = getattr(gr, "load", None) or gr.Interface.load

# Build the interface and start serving it.
_load_interface(MODEL_ID).launch()