"""Launch a Gradio demo for the princeton-nlp/Sheared-LLaMA-1.3B model.

Running this file builds a Gradio interface from the model identifier below
and starts serving it.
"""

import gradio as gr

# The "models/" prefix is part of the identifier handed to gr.load; per the
# Gradio docs it marks the remainder as a Hugging Face Hub model repository.
demo = gr.load("models/princeton-nlp/Sheared-LLaMA-1.3B")

# Start the web server for the loaded interface.
demo.launch()