Spaces:

OmPrakashSingh1704
/

ADVERTISE

Running

App Files Files Community

OmPrakashSingh1704 committed on Sep 18, 2024

Commit

25ef180

1 Parent(s): 06f6199

.

Browse files

Files changed (2) hide show

options/Video_model/Model.py +37 -28
options/Video_model/__pycache__/Model.cpython-310.pyc +0 -0

options/Video_model/Model.py CHANGED Viewed

@@ -1,26 +1,29 @@
-# import spaces
-import torch,os
-from diffusers import StableVideoDiffusionPipeline
-from diffusers.utils import load_image
 from PIL import Image
 from .tdd_svd_scheduler import TDDSVDStochasticIterativeScheduler
 from .utils import load_lora_weights, save_video
-from typing import Optional
 from glob import glob
 svd_path = 'stabilityai/stable-video-diffusion-img2vid-xt-1-1'
 lora_repo_path = 'RED-AIGC/TDD'
 lora_weight_name = 'svd-xt-1-1_tdd_lora_weights.safetensors'
-device="cuda" if torch.cuda.is_available() else "cpu"
-# if torch.cuda.is_available():
-noise_scheduler = TDDSVDStochasticIterativeScheduler(num_train_timesteps = 250, sigma_min = 0.002, sigma_max = 700.0, sigma_data = 1.0,
-                                                    s_noise = 1.0, rho = 7, clip_denoised = False)
-pipeline = StableVideoDiffusionPipeline.from_pretrained(svd_path, scheduler = noise_scheduler, torch_dtype = torch.float16, variant = "fp16").to(device)
-load_lora_weights(pipeline.unet, lora_repo_path, weight_name = lora_weight_name)
-# @spaces.GPU
 def Video(
     image: Image,
     seed: Optional[int] = 1,
@@ -36,30 +39,36 @@ def Video(
     motion_bucket_id: int = 127,
     output_folder: str = "outputs_gradio",
 ):
     pipeline.scheduler.set_eta(eta)
     if randomize_seed:
-        seed = random.randint(0, max_64_bit_int)
     generator = torch.manual_seed(seed)
-    image=Image.fromarray(image)
     os.makedirs(output_folder, exist_ok=True)
     base_count = len(glob(os.path.join(output_folder, "*.mp4")))
     video_path = os.path.join(output_folder, f"{base_count:06d}.mp4")
-    with torch.autocast(device):
         frames = pipeline(
-            image, height = height, width = width,
-            num_inference_steps = num_inference_steps,
-            min_guidance_scale = min_guidance_scale,
-            max_guidance_scale = max_guidance_scale,
-            num_frames = num_frames, fps = fps, motion_bucket_id = motion_bucket_id,
-            decode_chunk_size = 8,
-            noise_aug_strength = 0.02,
-            generator = generator,
         ).frames[0]
-    save_video(frames, video_path, fps = fps, quality = 5.0)
     torch.manual_seed(seed)
-    return video_path, seed

+import torch
 from PIL import Image
+import os
+from diffusers import StableVideoDiffusionPipeline
 from .tdd_svd_scheduler import TDDSVDStochasticIterativeScheduler
 from .utils import load_lora_weights, save_video
 from glob import glob
+from typing import Optional
+# Define paths and device
 svd_path = 'stabilityai/stable-video-diffusion-img2vid-xt-1-1'
 lora_repo_path = 'RED-AIGC/TDD'
 lora_weight_name = 'svd-xt-1-1_tdd_lora_weights.safetensors'
+device = "cuda" if torch.cuda.is_available() else "cpu"
+# Initialize the noise scheduler and pipeline
+noise_scheduler = TDDSVDStochasticIterativeScheduler(
+    num_train_timesteps=250, sigma_min=0.002, sigma_max=700.0,
+    sigma_data=1.0, s_noise=1.0, rho=7, clip_denoised=False
+)
+pipeline = StableVideoDiffusionPipeline.from_pretrained(
+    svd_path, scheduler=noise_scheduler, torch_dtype=torch.float16, variant="fp16"
+).to(device)
+load_lora_weights(pipeline.unet, lora_repo_path, weight_name=lora_weight_name)
+# Video function definition
 def Video(
     image: Image,
     seed: Optional[int] = 1,
     motion_bucket_id: int = 127,
     output_folder: str = "outputs_gradio",
 ):
+    # Set the eta value in the scheduler
     pipeline.scheduler.set_eta(eta)
+    # Handle seed randomness
     if randomize_seed:
+        seed = random.randint(0, 2**64 - 1)
     generator = torch.manual_seed(seed)
+    # Ensure the image is converted to a format that the model can use
+    image = Image.fromarray(image)
     os.makedirs(output_folder, exist_ok=True)
     base_count = len(glob(os.path.join(output_folder, "*.mp4")))
     video_path = os.path.join(output_folder, f"{base_count:06d}.mp4")
+    # Use float32 for image processing to avoid BFloat16 errors
+    image = image.convert("RGB")  # Ensure image is in RGB format
+    with torch.autocast(device, dtype=torch.float32):
         frames = pipeline(
+            image, height=height, width=width,
+            num_inference_steps=num_inference_steps,
+            min_guidance_scale=min_guidance_scale,
+            max_guidance_scale=max_guidance_scale,
+            num_frames=num_frames, fps=fps, motion_bucket_id=motion_bucket_id,
+            decode_chunk_size=8,
+            noise_aug_strength=0.02,
+            generator=generator,
         ).frames[0]
+    # Save the generated video
+    save_video(frames, video_path, fps=fps, quality=5.0)
     torch.manual_seed(seed)
+    return video_path, seed

options/Video_model/__pycache__/Model.cpython-310.pyc CHANGED Viewed

Binary files a/options/Video_model/__pycache__/Model.cpython-310.pyc and b/options/Video_model/__pycache__/Model.cpython-310.pyc differ