Mochi1

Runtime error

App Files Files Community

Haoxin Chen committed on Apr 11, 2023

Commit

0757c55

1 Parent(s): 1e5bda6

add videocontrol code

Browse files

Files changed (5) hide show

.gitignore +4 -1
app.py +6 -4
demo_test.py +1 -1
input/flamingo.mp4 +0 -0
videocontrol_test.py +131 -0

.gitignore CHANGED Viewed

@@ -1,7 +1,10 @@
 .DS_Store
 *pyc
 __pycache__
 *.egg-info
 results
-*.ckpt

 .DS_Store
 *pyc
+.vscode
 __pycache__
 *.egg-info
 results
+*.ckpt
+*.pt
+*.pth

app.py CHANGED Viewed

@@ -1,7 +1,8 @@
 import os
 import sys
 import gradio as gr
-from demo_test import Text2Video, VideoContorl
 sys.path.insert(1, os.path.join(sys.path[0], 'lvdm'))
 t2v_examples = [
@@ -14,12 +15,12 @@ t2v_examples = [
 ]
 control_examples = [
-    ['01.mp4', 'a dog', 0, 50, 15, 1]
 ]
 def videocrafter_demo(result_dir='./tmp/'):
     text2video = Text2Video(result_dir)
-    videocontrol = VideoContorl()
     with gr.Blocks(analytics_enabled=False) as videocrafter_iface:
         gr.Markdown("<div align='center'> <h2> VideoCrafter: A Toolkit for Text-to-Video Generation and Editing </span> </h2> \
                      <a style='font-size:18px;color: #efefef' href='https://github.com/VideoCrafter/VideoCrafter'> Github </div>")
@@ -89,4 +90,5 @@ def videocrafter_demo(result_dir='./tmp/'):
 if __name__ == "__main__":
     result_dir = os.path.join('./', 'results')
     videocrafter_iface = videocrafter_demo(result_dir)
-    videocrafter_iface.launch(server_name='0.0.0.0', server_port=80)

 import os
 import sys
 import gradio as gr
+from videocrafter_test import Text2Video
+from videocontrol_test import VideoControl
 sys.path.insert(1, os.path.join(sys.path[0], 'lvdm'))
 t2v_examples = [
 ]
 control_examples = [
+    ['input/flamingo.mp4', 'An ostrich walking in the desert, photorealistic, 4k', 0, 50, 15, 1]
 ]
 def videocrafter_demo(result_dir='./tmp/'):
     text2video = Text2Video(result_dir)
+    videocontrol = VideoControl(result_dir)
     with gr.Blocks(analytics_enabled=False) as videocrafter_iface:
         gr.Markdown("<div align='center'> <h2> VideoCrafter: A Toolkit for Text-to-Video Generation and Editing </span> </h2> \
                      <a style='font-size:18px;color: #efefef' href='https://github.com/VideoCrafter/VideoCrafter'> Github </div>")
 if __name__ == "__main__":
     result_dir = os.path.join('./', 'results')
     videocrafter_iface = videocrafter_demo(result_dir)
+    videocrafter_iface.launch()
+    # videocrafter_iface.launch(server_name='0.0.0.0', server_port=80)

demo_test.py CHANGED Viewed

@@ -6,7 +6,7 @@ class Text2Video():
         return '01.mp4'
-class VideoContorl:
     def __init__(self) -> None:
         pass

         return '01.mp4'
+class VideoControl:
     def __init__(self) -> None:
         pass

input/flamingo.mp4 ADDED Viewed

Binary file (897 kB). View file

videocontrol_test.py ADDED Viewed

	@@ -0,0 +1,131 @@

+import argparse, os, sys, glob
+import datetime, time
+from omegaconf import OmegaConf
+import math
+import torch
+from decord import VideoReader, cpu
+import torchvision
+from pytorch_lightning import seed_everything
+from lvdm.samplers.ddim import DDIMSampler
+from lvdm.utils.common_utils import instantiate_from_config
+from lvdm.utils.saving_utils import tensor_to_mp4
+from scripts.sample_text2video_adapter import load_model_checkpoint, adapter_guided_synthesis
+import torchvision.transforms._transforms_video as transforms_video
+from huggingface_hub import hf_hub_download
+def load_video(filepath, frame_stride, video_size=(256,256), video_frames=16):
+    info_str = ''
+    vidreader = VideoReader(filepath, ctx=cpu(0), width=video_size[1], height=video_size[0])
+    max_frames = len(vidreader)
+    # auto
+    if frame_stride != 0:
+        if frame_stride * (video_frames-1) >= max_frames:
+            info_str += "Warning: The user-set frame rate makes the current video length not enough, we will set it to an adaptive frame rate.\n"
+            frame_stride = 0
+    if frame_stride == 0:
+        frame_stride = max_frames / video_frames
+        # if temp_stride < 1:
+            # info_str = "Warning: The length of the current input video is less than 16 frames, we will automatically fill to 16 frames for you.\n"
+    if frame_stride > 8:
+        frame_stride = 8
+        info_str += "Warning: The current input video length is longer than 128 frames, we will process only the first 128 frames.\n"
+    info_str += f"Frame Stride is set to {frame_stride}"
+    frame_indices = [int(frame_stride*i) for i in range(video_frames)]
+    frames = vidreader.get_batch(frame_indices)
+    ## [t,h,w,c] -> [c,t,h,w]
+    frame_tensor = torch.tensor(frames.asnumpy()).permute(3, 0, 1, 2).float()
+    frame_tensor = (frame_tensor / 255. - 0.5) * 2
+    return frame_tensor, info_str
+class VideoControl:
+    def __init__(self, result_dir='./tmp/') -> None:
+        self.savedir = result_dir
+        self.download_model()
+        config_path = "models/adapter_t2v_depth/model_config.yaml"
+        ckpt_path = "models/base_t2v/model.ckpt"
+        adapter_ckpt = "models/adapter_t2v_depth/adapter.pth"
+        config = OmegaConf.load(config_path)
+        model_config = config.pop("model", OmegaConf.create())
+        model = instantiate_from_config(model_config)
+        model = model.to('cuda')
+        assert os.path.exists(ckpt_path), "Error: checkpoint Not Found!"
+        model = load_model_checkpoint(model, ckpt_path, adapter_ckpt)
+        model.eval()
+        self.model = model
+        self.resolution=256
+        self.spatial_transform = transforms_video.CenterCropVideo(self.resolution)
+    def get_video(self, input_video, input_prompt, frame_stride=0, vc_steps=50, vc_cfg_scale=15.0, vc_eta=1.0):
+        ## load video
+        print("input video", input_video)
+        info_str = ''
+        try:
+            h, w, c = VideoReader(input_video, ctx=cpu(0))[0].shape
+        except:
+            os.remove(input_video)
+            return 'please input video', None
+        if h < w:
+            scale = h / self.resolution
+        else:
+            scale = w / self.resolution
+        h = math.ceil(h / scale)
+        w = math.ceil(w / scale)
+        try:
+            video, info_str = load_video(input_video, frame_stride, video_size=(h, w), video_frames=16)
+        except:
+            os.remove(input_video)
+            return 'load video error', None
+        video = self.spatial_transform(video)
+        print('video shape', video.shape)
+        h, w = 32, 32
+        bs = 1
+        channels = self.model.channels
+        frames = self.model.temporal_length
+        noise_shape = [bs, channels, frames, h, w]
+        ## inference
+        start = time.time()
+        prompt = input_prompt
+        video = video.unsqueeze(0).to("cuda")
+        with torch.no_grad():
+            batch_samples, batch_conds = adapter_guided_synthesis(self.model, prompt, video, noise_shape, n_samples=1, ddim_steps=vc_steps, ddim_eta=vc_eta, unconditional_guidance_scale=vc_cfg_scale)
+        batch_samples = batch_samples[0]
+        os.makedirs(self.savedir, exist_ok=True)
+        filename = prompt
+        filename = filename.replace("/", "_slash_") if "/" in filename else filename
+        filename = filename.replace(" ", "_") if " " in filename else filename
+        video_path = os.path.join(self.savedir, f'{filename}_sample.mp4')
+        # tensor_to_mp4(video=batch_conds.detach().cpu(), savepath=os.path.join(self.savedir, f'{filename}_depth.mp4'), fps=10)
+        tensor_to_mp4(video=batch_samples.detach().cpu(), savepath=os.path.join(self.savedir, f'{filename}_sample.mp4'), fps=8)
+        print(f"Saved in {video_path}. Time used: {(time.time() - start):.2f} seconds")
+        # delete video
+        os.remove(input_video)
+        return info_str, video_path
+    def download_model(self):
+        REPO_ID = 'VideoCrafter/t2v-version-1-1'
+        filename_list = ['models/base_t2v/model.ckpt',
+                         "models/adapter_t2v_depth/adapter.pth"
+                         "models/adapter_t2v_depth/dpt_hybrid-midas.pt"
+                        ]
+        for filename in filename_list:
+            if not os.path.exists(filename):
+                hf_hub_download(repo_id=REPO_ID, filename=filename, local_dir='./', local_dir_use_symlinks=False)
+if __name__ == "__main__":
+    vc = VideoControl('./result')
+    info_str, video_path =  vc.get_video('input/flamingo.mp4',"An ostrich walking in the desert, photorealistic, 4k")