# Minimal Gradio app: load a hosted model by its hub identifier and serve it
# through Gradio's auto-generated web interface.
import gradio as gr

# Newer Gradio releases expose the loader as `gr.load`; older ones only provide
# `gr.Interface.load`. Use whichever this installation has so the script runs
# on both.
_load_interface = getattr(gr, "load", None) or gr.Interface.load

# Build the interface for the model and start the web server.
_load_interface("models/Neko-Institute-of-Science/LLaMA-13B-4bit-128g").launch()