# Gradio app that loads a model hosted on the Hugging Face Hub and serves
# the auto-generated demo UI for it.
import gradio as gr

# Hub identifier of the model to serve; the "models/" prefix is the form
# Gradio's loader expects for Hub-hosted models.
MODEL_ID = "models/princeton-nlp/Sheared-LLaMA-2.7B"

# Newer Gradio releases expose the loader as top-level `gr.load`, replacing
# the legacy `gr.Interface.load`. Prefer the new entry point and fall back to
# the legacy one so the script keeps working on older installs.
_load_from_hub = getattr(gr, "load", None) or gr.Interface.load

# Build the demo from the Hub model and start the web server.
demo = _load_from_hub(MODEL_ID)
demo.launch()