VideoLLaMA2-AV

Running on Zero

App Files Files Community

lixin4ever

ZYX123 committed on Oct 23

Commit

a5deedf

•

1 Parent(s): e52682b

add requirements.txt (#3)

Browse files

- add requirements.txt (e818756da384130f584390d4c7707ecf72384d29)
- add requirements.txt (0658a9d415b8cd677486731ecac8757a4d15f2a3)

Co-authored-by: yongxinzhu <zyx123@users.noreply.huggingface.co>

Files changed (2) hide show

app.py +2 -2
requirements.txt +41 -0

app.py CHANGED Viewed

@@ -321,11 +321,11 @@ with gr.Blocks(title='VideoLLaMA 2 🔥🚀🔥', theme=theme, css=block_css) as
                 examples=[
                     [
                         f"{cur_dir}/examples/00000368.mp4",
-                        "Where is the loudest instrument?",
                     ],
                     [
                         f"{cur_dir}/examples/00003491.mp4",
-                        "Is the instrument on the left louder than the instrument on the right?",
                     ],
                 ],
                 inputs=[video, textbox],

                 examples=[
                     [
                         f"{cur_dir}/examples/00000368.mp4",
+                        "Please describe the video with audio information:",
                     ],
                     [
                         f"{cur_dir}/examples/00003491.mp4",
+                        "Where is the loudest instrument?",
                     ],
                 ],
                 inputs=[video, textbox],

requirements.txt ADDED Viewed

@@ -0,0 +1,41 @@

+# basic dependencies
+torch==2.2.0
+torchaudio==2.2.0
+torchvision==0.17.0
+transformers==4.42.3
+tokenizers==0.19.1
+deepspeed==0.13.1
+accelerate==0.26.1
+peft==0.4.0
+timm==1.0.3
+numpy==1.24.4
+# data processing
+decord==0.6.0
+imageio==2.34.0
+imageio-ffmpeg==0.4.9
+moviepy==1.0.3
+scenedetect==0.6.3
+opencv-python==4.6.0.66
+pysubs2
+librosa
+pytorchvideo
+# misc
+scikit-learn==1.2.2
+huggingface_hub==0.23.4
+sentencepiece==0.1.99
+shortuuid
+einops==0.6.1
+einops-exts==0.0.4
+bitsandbytes==0.43.0
+pydantic>=2.0
+markdown2[all]
+gradio==3.50.0
+gradio_client==0.6.1
+httpx==0.24.1
+openai==1.33.0
+requests
+uvicorn
+fastapi
+tensorboard
+wandb
+tabulate