"""Launch a Gradio demo for the VILA-13b-4bit-awq model.

Running this script loads the model reference with ``gr.load`` and starts
the resulting Gradio app with its default launch settings.
"""

import gradio as gr

# The "models/" prefix is part of the identifier handed to gr.load;
# presumably it selects a model hosted on the Hugging Face Hub -- confirm
# against the Gradio documentation for gr.load.
demo = gr.load("models/Efficient-Large-Model/VILA-13b-4bit-awq")

# Start the web server for the loaded demo.
demo.launch()