"""Launch a Gradio demo for the Efficient-Large-Model/VILA-7b-4bit-awq model."""

import gradio as gr

# The "models/" prefix asks gr.load to build the interface from a model repo
# on the Hugging Face Hub rather than from a Space.
demo = gr.load("models/Efficient-Large-Model/VILA-7b-4bit-awq")

# Start serving the loaded interface with Gradio's default launch settings.
demo.launch()