"""Launch a Gradio demo for a model hosted on the Hugging Face Hub."""

import gradio as gr

# The "models/" prefix asks Gradio to resolve the rest of the name as a
# Hugging Face Hub model repository.
MODEL_NAME = "models/soulteary/Chinese-Llama-2-7b-ggml-q4"

# `gr.Interface.load` was deprecated in favour of the top-level `gr.load`
# and is absent from newer Gradio releases; prefer the new entry point and
# fall back to the legacy one so older installations keep working.
load_demo = gr.load if hasattr(gr, "load") else gr.Interface.load

# Build the interface for the model and start the web server.
load_demo(MODEL_NAME).launch()