# NOTE: captured from a Hugging Face Spaces page; the page header reported the Space status as "Sleeping".
import os | |
os.environ["GRADIO_TEMP_DIR"] = os.path.join(os.getcwd(), ".tmp_outputs") | |
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True" | |
import uuid | |
import gradio as gr | |
import spaces | |
from videosys import CogVideoXConfig, CogVideoXPABConfig, VideoSysEngine | |
# Default text shown in the prompt textbox when the demo loads.
PROMPT = (
    "A modern living room with a minimalist design, featuring a large window, "
    "a white ceiling, and a wooden floor. "
    "The room is furnished with a white sofa, a gray ottoman, a wooden table, "
    "and a hanging light. "
    "The space is well-lit and has a clean, contemporary aesthetic."
)
def load_model(model_name, enable_video_sys=False, pab_threshold=None, pab_range=2):
    """Build a ``VideoSysEngine`` for ``model_name``.

    Args:
        model_name: Model identifier forwarded to ``CogVideoXConfig``.
        enable_video_sys: Forwarded as ``enable_pab`` to ``CogVideoXConfig``.
        pab_threshold: Two-element list forwarded as ``spatial_threshold`` to
            ``CogVideoXPABConfig``. ``None`` (the default) means ``[100, 850]``.
        pab_range: Forwarded as ``spatial_range`` to ``CogVideoXPABConfig``.

    Returns:
        The engine constructed from the resulting configuration.
    """
    # A list literal as a default argument is created once and shared by every
    # call; build a fresh list per call so the config object never aliases it.
    if pab_threshold is None:
        pab_threshold = [100, 850]

    pab_config = CogVideoXPABConfig(spatial_threshold=pab_threshold, spatial_range=pab_range)
    config = CogVideoXConfig(model_name, enable_pab=enable_video_sys, pab_config=pab_config)
    return VideoSysEngine(config)
def generate(engine, prompt, num_inference_steps=50, guidance_scale=6.0):
    """Generate one video for ``prompt`` and save it as an MP4 file.

    Args:
        engine: Object exposing ``generate(prompt, num_inference_steps=...,
            guidance_scale=...)`` (whose result has a ``video`` sequence) and
            ``save_video(video, path)``.
        prompt: Text prompt passed to the engine.
        num_inference_steps: Forwarded to ``engine.generate``.
        guidance_scale: Forwarded to ``engine.generate``.

    Returns:
        The path of the saved file, ``./.tmp_outputs/<random hex>.mp4``.
    """
    result = engine.generate(prompt, num_inference_steps=num_inference_steps, guidance_scale=guidance_scale)
    video = result.video[0]  # only the first generated video is kept

    output_dir = "./.tmp_outputs"
    # Do not rely on the engine (or Gradio) having created the folder already.
    os.makedirs(output_dir, exist_ok=True)

    # A random name keeps concurrent or repeated requests from overwriting each other.
    output_path = os.path.join(output_dir, f"{uuid.uuid4().hex}.mp4")
    engine.save_video(video, output_path)
    return output_path
def generate_vs(
    model_name,
    prompt,
    num_inference_steps,
    guidance_scale,
    threshold_start,
    threshold_end,
    gap,
    progress=gr.Progress(track_tqdm=True),
):
    """Click handler: load the chosen model with PAB enabled and render a video.

    Args:
        model_name: Model identifier handed to ``load_model``.
        prompt: Text prompt for the video.
        num_inference_steps: Forwarded to ``generate``.
        guidance_scale: Forwarded to ``generate``.
        threshold_start: Broadcast start timestep; cast to ``int``.
        threshold_end: Broadcast end timestep; cast to ``int``.
        gap: Broadcast range; cast to ``int``.
        progress: Gradio progress tracker created with ``track_tqdm=True``;
            it is not referenced in the body.

    Returns:
        Path of the generated video file.
    """
    # The threshold pair is ordered [end, start], matching load_model's
    # default of [100, 850].
    pab_window = [int(threshold_end), int(threshold_start)]
    engine = load_model(
        model_name,
        enable_video_sys=True,
        pab_threshold=pab_window,
        pab_range=int(gap),
    )
    return generate(engine, prompt, num_inference_steps, guidance_scale)
# Custom stylesheet passed to gr.Blocks(css=css).
# The narrow-screen `.video-output` override lives inside the media query and
# the braces are balanced (the previous text had a stray closing brace).
css = """
body {
    font-family: Arial, sans-serif;
    line-height: 1.6;
    color: #333;
    margin: 0 auto;
    padding: 20px;
}
.container {
    display: flex;
    flex-direction: column;
    gap: 10px;
}
.row {
    display: flex;
    flex-wrap: wrap;
    gap: 10px;
}
.column {
    flex: 1;
    min-width: 0;
}
.video-output {
    width: 100%;
    max-width: 720px;
    height: auto;
    margin: 0 auto;
}
.server-status {
    margin-top: 5px;
    padding: 5px;
    font-size: 0.8em;
}
.server-status h4 {
    margin: 0 0 3px 0;
    font-size: 0.9em;
}
.server-status .row {
    margin-bottom: 2px;
}
.server-status .textbox {
    min-height: unset !important;
}
.server-status .textbox input {
    padding: 1px 5px !important;
    height: 20px !important;
    font-size: 0.9em !important;
}
.server-status .textbox label {
    margin-bottom: 0 !important;
    font-size: 0.9em !important;
    line-height: 1.2 !important;
}
.server-status .textbox {
    gap: 0 !important;
}
.server-status .textbox input {
    margin-top: -2px !important;
}
@media (max-width: 768px) {
    .row {
        flex-direction: column;
    }
    .column {
        width: 100%;
    }
    .video-output {
        width: 100%;
        height: auto;
    }
}
"""
# Gradio UI: header, prompt and parameter controls, video output, a static
# gallery, and the click wiring for the generate button.
# NOTE(review): the component nesting below was reconstructed from a copy of
# the file whose indentation had been stripped — confirm the Row/Column layout.
with gr.Blocks(css=css) as demo:
    gr.HTML(
        """
        <div style="text-align: center; font-size: 32px; font-weight: bold; margin-bottom: 20px;">
        KoolCogVideoX Huggingface Space🤗
        </div>
        <div style="text-align: center; font-size: 15px; margin-bottom: 20px;">
        KoolCogVideoX is fine-tuned on <a href="https://huggingface.co/collections/THUDM/cogvideo-66c08e62f1685a3ade464cce">CogVideoX</a> specifically for interior design scenarios.<br>
        The demo is powered by <a href="https://github.com/NUS-HPC-AI-Lab/VideoSys">https://github.com/NUS-HPC-AI-Lab/VideoSys</a>.<br>
        ⚠️ This demo is for academic research and experiential use only. Users should strictly adhere to local laws and ethics.
        </div>
        <div style="text-align: center;display: flex;justify-content: center;align-items: center;">
        Due to limited GPU quota, the 5B model cannot be run using GPU ZERO. You can duplicate this space and utilize your own resources to run the 5B model.
        <a href="https://huggingface.co/spaces/bertjiazheng/KoolCogVideoX?duplicate=true"><img src="https://huggingface.co/datasets/huggingface/badges/resolve/main/duplicate-this-space-lg.svg" width="160"></a>
        </div>
        """
    )

    with gr.Row():
        with gr.Column():
            prompt = gr.Textbox(label="Prompt (Less than 200 Words)", value=PROMPT, lines=2)

            with gr.Column():
                gr.Markdown("**Generation Parameters**<br>")
                with gr.Row():
                    model_name = gr.Radio(
                        ["bertjiazheng/KoolCogVideoX-2b", "bertjiazheng/KoolCogVideoX-5b"],
                        label="Model Type",
                        value="bertjiazheng/KoolCogVideoX-2b",
                    )
                with gr.Row():
                    num_inference_steps = gr.Slider(label="Inference Steps", maximum=50, value=50)
                    guidance_scale = gr.Slider(label="Guidance Scale", value=6.0, maximum=15.0)

                gr.Markdown("**Pyramid Attention Broadcast Parameters**<br>")
                with gr.Row():
                    pab_range = gr.Slider(
                        label="Broadcast Range",
                        value=2,
                        step=1,
                        minimum=1,
                        maximum=4,
                        info="Attention broadcast range.",
                    )
                    pab_threshold_start = gr.Slider(
                        label="Start Timestep",
                        minimum=500,
                        maximum=1000,
                        value=850,
                        step=1,
                        info="Broadcast start timestep (1000 is the first).",
                    )
                    pab_threshold_end = gr.Slider(
                        label="End Timestep",
                        minimum=0,
                        maximum=500,
                        step=1,
                        value=100,
                        info="Broadcast end timestep (0 is the last).",
                    )
                with gr.Row():
                    generate_button_vs = gr.Button("⚡️ Generate Video with VideoSys")

        with gr.Column():
            with gr.Row():
                video_output_vs = gr.Video(label="CogVideoX with VideoSys", width=720, height=480)

    # The gallery markup is kept flush-left and free of blank lines so a
    # Markdown renderer treats it as one raw HTML block rather than as an
    # indented code block. The heading <div>s sit before the <table> because
    # <div> is not valid directly inside <table>.
    gr.Markdown("""
<div style="text-align: center; font-size: 32px; font-weight: bold; margin-bottom: 20px;">
🎥 Video Gallery
</div>
<div style="text-align: center; font-size: 15px;">
These videos are generated by KoolCogVideoX-5b.
</div>
<table border="0" style="width: 100%; text-align: left; margin-top: 20px;">
<tr>
<td style="width: 25%; vertical-align: top; font-size: 0.9em;">
<p>A modern living room with a minimalist design, featuring a white sofa, a marble coffee table, a geometric painting, and a chandelier hanging from the ceiling. The room is well-lit with natural light, and the color scheme is neutral with accents of gold and black. The furniture is arranged in a way that creates a comfortable and inviting space.
</p>
</td>
<td style="width: 25%; vertical-align: top;">
<video src="https://manycore-research-azure.kujiale.com/manycore-research/KoolCogVideoX-5b/L3D386S81B20ENDPDZEFIAUWJLWGLUFX7LB6KY8.mp4" width="100%" controls autoplay loop></video>
</td>
<td style="width: 25%; vertical-align: top; font-size: 0.9em;">
<p>A modern living room with a minimalist design, featuring a large window, a white ceiling, and a wooden floor. The room is furnished with a white sofa, a gray ottoman, a wooden table, and a hanging light. The space is well-lit and has a clean, contemporary aesthetic.</p>
</td>
<td style="width: 25%; vertical-align: top;">
<video src="https://manycore-research-azure.kujiale.com/manycore-research/KoolCogVideoX-5b/L3D489S267B0ENDPN7LV6QUWLYIALUFX4RSVTA8.mp4" width="100%" controls autoplay loop></video>
</td>
</tr>
<tr>
<td style="width: 25%; vertical-align: top; font-size: 0.9em;">
<p>A modern bedroom with a minimalist design, featuring a large bed with a gray comforter and a blue blanket, a white dresser with a mirror, and a white closet. The room is decorated with framed artwork and a black and white poster on the wall. The floor is made of light wood, and the room has a clean and contemporary feel.</p>
</td>
<td style="width: 25%; vertical-align: top;">
<video src="https://manycore-research-azure.kujiale.com/manycore-research/KoolCogVideoX-5b/L3D943S369B0ENDPNXSMXYUWLGWQLUFX6ZZZWA8.mp4" width="100%" controls autoplay loop></video>
</td>
<td style="width: 25%; vertical-align: top; font-size: 0.9em;">
<p>A modern kitchen with a sleek design, featuring a marble countertop, stainless steel appliances, and a variety of bottles and glasses. The kitchen is well-lit with recessed lighting and has a contemporary aesthetic.</p>
</td>
<td style="width: 25%; vertical-align: top;">
<video src="https://manycore-research-azure.kujiale.com/manycore-research/KoolCogVideoX-5b/L3D670S366B0ENDPOAJ4LQUWJN2ILUFX5GLPRQ8.mp4" width="100%" controls autoplay loop></video>
</td>
</tr>
</table>
""")

    # Input order must match generate_vs's positional parameters:
    # (model_name, prompt, steps, guidance, threshold_start, threshold_end, gap).
    generate_button_vs.click(
        generate_vs,
        inputs=[
            model_name,
            prompt,
            num_inference_steps,
            guidance_scale,
            pab_threshold_start,
            pab_threshold_end,
            pab_range,
        ],
        outputs=[video_output_vs],
        concurrency_id="gen",
        concurrency_limit=1,
    )
if __name__ == "__main__":
    # Enable the request queue (at most 10 waiting requests, default
    # concurrency limit of 1 per event), then start the app.
    demo.queue(max_size=10, default_concurrency_limit=1).launch()