"""Gradio entry point: load a hosted model as a demo UI and serve it.

Running this file builds a Gradio interface for the model identified by
``models/Qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4`` and starts the web server.
"""
import gradio as gr

# Build the interface from the model identifier. The "models/" prefix is
# Gradio's way of selecting the source in `gr.load` (see the Gradio docs);
# NOTE(review): whether this particular checkpoint is actually served by the
# remote backend cannot be determined from this file -- confirm at deploy time.
demo = gr.load("models/Qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4")

# Start serving the interface with Gradio's default launch settings.
demo.launch()