vinesmsuic committed
Commit f2d9a72
1 Parent(s): 6b98080
app.py CHANGED
@@ -14,8 +14,7 @@ from PIL import Image
 import torch
 import numpy as np
 
-from black_box_image_edit.cosxl_edit import CosXLEdit
-#from black_box_image_edit.instructpix2pix import InstructPix2Pix
+from black_box_image_edit.instructpix2pix import InstructPix2Pix
 from prepare_video import crop_and_resize_video
 from edit_image import infer_video
 
@@ -41,7 +40,7 @@ demo_examples = [
 TEMP_DIR = "_demo_temp"
 
 
-image_edit_model = CosXLEdit()
+image_edit_model = InstructPix2Pix()
 
 @torch.no_grad()
 @spaces.GPU(duration=30)
@@ -316,7 +315,7 @@ with gr.Blocks() as demo:
     gr.Markdown("Official 🤗 Gradio demo for [AnyV2V: A Plug-and-Play Framework For Any Video-to-Video Editing Tasks](https://tiger-ai-lab.github.io/AnyV2V/)")
 
     with gr.Tabs():
-        with gr.TabItem('AnyV2V(I2VGenXL) + CosXLEdit'):
+        with gr.TabItem('AnyV2V(I2VGenXL) + InstructPix2Pix'):
             gr.Markdown("# Preprocessing Video Stage")
             gr.Markdown("In this demo, AnyV2V only supports videos with a duration of 2 seconds at 8 fps. If your video is not in this format, we will preprocess it for you. Click the Preprocess video button!")
             with gr.Row():
@@ -340,7 +339,7 @@
                 pv_longest_to_width = gr.Checkbox(label="Resize Longest Dimension to Width")
 
             gr.Markdown("# Image Editing Stage")
-            gr.Markdown("Edit the first frame of the video to your liking! Click the Edit the first frame button after entering the editing instruction prompt. This image editing stage is powered by CosXLEdit. You can try editing the image multiple times until you are happy with the result! You can also download the first frame of the video and edit it with other software (e.g. Photoshop, GIMP, etc.), or use other image editing models to obtain the edited frame and upload it directly.")
+            gr.Markdown("Edit the first frame of the video to your liking! Click the Edit the first frame button after entering the editing instruction prompt. This image editing stage is powered by InstructPix2Pix. You can try editing the image multiple times until you are happy with the result! You can also download the first frame of the video and edit it with other software (e.g. Photoshop, GIMP, etc.), or use other image editing models to obtain the edited frame and upload it directly.")
             with gr.Row():
                 with gr.Column():
                     src_first_frame = gr.Image(label="First Frame", type="filepath", interactive=False)
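
Note: this commit makes InstructPix2Pix the default image-editing backend for the Space. The wrapper itself is not shown in the diff; below is a minimal sketch of what black_box_image_edit/instructpix2pix.py plausibly looks like, assuming it mirrors CosXLEdit's infer_one_image interface (see the cosxl_edit.py diff below) and builds on diffusers' StableDiffusionInstructPix2PixPipeline with the timbrooks/instruct-pix2pix checkpoint. The checkpoint name and generation arguments are assumptions, not confirmed by this diff.

```python
# Sketch only: assumed to approximate black_box_image_edit/instructpix2pix.py.
import PIL.Image
import torch
from diffusers import StableDiffusionInstructPix2PixPipeline

class InstructPix2Pix:
    def __init__(self, device="cuda"):
        self.pipe = StableDiffusionInstructPix2PixPipeline.from_pretrained(
            "timbrooks/instruct-pix2pix",  # assumed checkpoint, not named in this diff
            torch_dtype=torch.float16,
            safety_checker=None,
        )
        self.pipe.to(device)

    def infer_one_image(self, src_image: PIL.Image.Image = None,
                        instruct_prompt: str = None, seed: int = 42):
        generator = torch.manual_seed(seed)
        return self.pipe(
            instruct_prompt,
            image=src_image,
            num_inference_steps=20,    # assumed default
            image_guidance_scale=1.5,  # fidelity to the input frame
            generator=generator,
        ).images[0]
```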
app_ip2p.py → app_cosxl.py RENAMED
@@ -14,7 +14,8 @@ from PIL import Image
 import torch
 import numpy as np
 
-from black_box_image_edit.instructpix2pix import InstructPix2Pix
+from black_box_image_edit.cosxl_edit import CosXLEdit
+#from black_box_image_edit.instructpix2pix import InstructPix2Pix
 from prepare_video import crop_and_resize_video
 from edit_image import infer_video
 
@@ -40,7 +41,7 @@ demo_examples = [
 TEMP_DIR = "_demo_temp"
 
 
-image_edit_model = InstructPix2Pix()
+image_edit_model = CosXLEdit()
 
 @torch.no_grad()
 @spaces.GPU(duration=30)
@@ -315,7 +316,7 @@ with gr.Blocks() as demo:
     gr.Markdown("Official 🤗 Gradio demo for [AnyV2V: A Plug-and-Play Framework For Any Video-to-Video Editing Tasks](https://tiger-ai-lab.github.io/AnyV2V/)")
 
     with gr.Tabs():
-        with gr.TabItem('AnyV2V(I2VGenXL) + InstructPix2Pix'):
+        with gr.TabItem('AnyV2V(I2VGenXL) + CosXLEdit'):
             gr.Markdown("# Preprocessing Video Stage")
             gr.Markdown("In this demo, AnyV2V only supports videos with a duration of 2 seconds at 8 fps. If your video is not in this format, we will preprocess it for you. Click the Preprocess video button!")
             with gr.Row():
@@ -339,7 +340,7 @@
                 pv_longest_to_width = gr.Checkbox(label="Resize Longest Dimension to Width")
 
             gr.Markdown("# Image Editing Stage")
-            gr.Markdown("Edit the first frame of the video to your liking! Click the Edit the first frame button after entering the editing instruction prompt. This image editing stage is powered by InstructPix2Pix. You can try editing the image multiple times until you are happy with the result! You can also download the first frame of the video and edit it with other software (e.g. Photoshop, GIMP, etc.), or use other image editing models to obtain the edited frame and upload it directly.")
+            gr.Markdown("Edit the first frame of the video to your liking! Click the Edit the first frame button after entering the editing instruction prompt. This image editing stage is powered by CosXLEdit. You can try editing the image multiple times until you are happy with the result! You can also download the first frame of the video and edit it with other software (e.g. Photoshop, GIMP, etc.), or use other image editing models to obtain the edited frame and upload it directly.")
             with gr.Row():
                 with gr.Column():
                     src_first_frame = gr.Image(label="First Frame", type="filepath", interactive=False)
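
Note: the renamed app_cosxl.py keeps the CosXL-backed variant as a secondary entry point. For context, a CosXL instruction-edit pipeline is typically assembled in diffusers as sketched below, consistent with the EDMEulerScheduler configuration visible in black_box_image_edit/cosxl_edit.py; the weights location and the from_single_file arguments are assumptions based on the public stabilityai/cosxl release, not on this diff.

```python
# Sketch of a typical CosXL edit pipeline setup (assumed, not from this diff).
import torch
from diffusers import StableDiffusionXLInstructPix2PixPipeline, EDMEulerScheduler
from huggingface_hub import hf_hub_download

# Assumed weights location: the stabilityai/cosxl repo hosts cosxl_edit.safetensors.
edit_file = hf_hub_download(repo_id="stabilityai/cosxl", filename="cosxl_edit.safetensors")
pipe = StableDiffusionXLInstructPix2PixPipeline.from_single_file(
    edit_file,
    num_in_channels=8,  # the edit UNet also conditions on the input-image latents
    torch_dtype=torch.float16,
)
# Matches the scheduler configured in black_box_image_edit/cosxl_edit.py below.
pipe.scheduler = EDMEulerScheduler(
    sigma_min=0.002, sigma_max=120.0, sigma_data=1.0, prediction_type="v_prediction"
)
```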
black_box_image_edit/cosxl_edit.py CHANGED
@@ -28,6 +28,8 @@ class CosXLEdit():
         )
         self.pipe.scheduler = EDMEulerScheduler(sigma_min=0.002, sigma_max=120.0, sigma_data=1.0, prediction_type="v_prediction")
         self.pipe.to(device)
+        self.pipe.enable_vae_tiling()
+        self.pipe.enable_model_cpu_offload()
 
     def infer_one_image(self, src_image: PIL.Image.Image = None, src_prompt: str = None, target_prompt: str = None, instruct_prompt: str = None, seed: int = 42, negative_prompt=""):
         """
requirements.txt CHANGED
@@ -1,7 +1,7 @@
 torch==2.1.0
 torchvision==0.16.0
 accelerate
-diffusers==0.27.0
+diffusers==0.26.3
 transformers
 omegaconf
 opencv-python
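
Note: the diffusers pin moves down from 0.27.0 to 0.26.3 in the same commit that makes InstructPix2Pix the default backend. It is worth verifying that the pinned release still exposes everything both entry points import; EDMEulerScheduler in particular is a relatively recent addition, so the CosXL path may need a newer diffusers. A quick sanity check, under that assumption:

```python
# Check that the pinned diffusers exposes what each backend needs.
import diffusers

print(diffusers.__version__)  # expect 0.26.3 per requirements.txt

from diffusers import StableDiffusionInstructPix2PixPipeline  # InstructPix2Pix path
try:
    from diffusers import EDMEulerScheduler  # used by black_box_image_edit/cosxl_edit.py
except ImportError:
    print("EDMEulerScheduler unavailable; the CosXL path may need a newer diffusers")
```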