import argparse import imageio import numpy as np import gradio as gr from PIL import Image from demo.motiondirector import MotionDirector runner = MotionDirector() def motiondirector(model_select, text_pormpt, neg_text_pormpt, random_seed=1, steps=25, guidance_scale=7.5, baseline_select=False): return runner(model_select, text_pormpt, neg_text_pormpt, int(random_seed) if random_seed != "" else 1, int(steps), float(guidance_scale), baseline_select) with gr.Blocks() as demo: gr.HTML( """
""") with gr.Row(): generated_video_baseline = gr.Video(format="mp4", label="Video Generated by base model (ZeroScope with same seed)") generated_video = gr.Video(format="mp4", label="Video Generated by MotionDirector") with gr.Column(): baseline_select = gr.Checkbox(label="Compare with baseline (ZeroScope with same seed)", info="Run baseline? Note: Inference time will be doubled.") random_seed = gr.Textbox(label="Random seed", value=1, info="default: 1") sampling_steps = gr.Textbox(label="Sampling steps", value=30, info="default: 30") guidance_scale = gr.Textbox(label="Guidance scale", value=12, info="default: 12") with gr.Row(): model_select = gr.Dropdown( ["1-1: [Cinematic Shots] -- Dolly Zoom (Hitchcockian Zoom)", "1-2: [Cinematic Shots] -- Zoom In", "1-3: [Cinematic Shots] -- Zoom Out", "2-1: [Object Trajectory] -- Right to Left", "2-2: [Object Trajectory] -- Left to Right", "3-1: [Sports Concepts] -- Riding Bicycle", "3-2: [Sports Concepts] -- Riding Horse", "3-3: [Sports Concepts] -- Lifting Weights", "3-4: [Sports Concepts] -- Playing Golf" ], label="MotionDirector", info="Which MotionDirector would you like to use!" ) text_pormpt = gr.Textbox(label="Text Prompt", value='', placeholder="Input your text prompt here!") neg_text_pormpt = gr.Textbox(label="Negative Text Prompt", value='', placeholder="default: None") submit = gr.Button("Generate") # when the `submit` button is clicked submit.click( motiondirector, [model_select, text_pormpt, neg_text_pormpt, random_seed, sampling_steps, guidance_scale, baseline_select], [generated_video, generated_video_baseline] ) # Examples gr.Markdown("## Examples") gr.Examples( fn=motiondirector, examples=[ ["1-1: [Cinematic Shots] -- Dolly Zoom (Hitchcockian Zoom)", "A lion sitting on top of a cliff captured with a dolly zoom.", 1675932], ["1-2: [Cinematic Shots] -- Zoom In", "A firefighter standing in front of a burning forest captured with a zoom in.", 1429227], ["1-3: [Cinematic Shots] -- Zoom Out", "A lion sitting on top of a cliff captured with a zoom out.", 1767994], ["2-1: [Object Trajectory] -- Right to Left", "A tank is running on the moon.", 8551187], ["2-2: [Object Trajectory] -- Left to Right", "A tiger is running in the forest.", 3463673], ["3-1: [Sports Concepts] -- Riding Bicycle", "An astronaut is riding a bicycle past the pyramids Mars 4K high quailty highly detailed.", 4422954], ["3-2: [Sports Concepts] -- Riding Horse", "A man riding an elephant through the jungle.", 6230765], ["3-3: [Sports Concepts] -- Lifting Weights", "A panda is lifting weights in a garden.", 1699276], ["3-4: [Sports Concepts] -- Playing Golf", "A man is playing golf in front of the White House.", 8870450], ], inputs=[model_select, text_pormpt, random_seed], outputs=generated_video, ) demo.queue(max_size=15) demo.launch(share=False)