Chat-UniVi
committed on
Commit
•
66c1e7f
1
Parent(s):
c89d507
Update README.md
Browse files
README.md
CHANGED
@@ -1,6 +1,15 @@
|
|
1 |
---
|
2 |
license: llama2
|
3 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4 |
## 😮 Highlights
|
5 |
|
6 |
### 💡 Unified visual representation for image and video
|
@@ -90,7 +99,7 @@ def _get_rawvideo_dec(video_path, image_processor, max_frames=MAX_IMAGE_LENGTH,
|
|
90 |
|
91 |
if __name__ == '__main__':
|
92 |
# Model Parameter
|
93 |
-
model_path =
|
94 |
video_path = ${video_path}
|
95 |
max_frames = ${max_frames}
|
96 |
|
@@ -188,7 +197,7 @@ from PIL import Image
|
|
188 |
|
189 |
if __name__ == '__main__':
|
190 |
# Model Parameter
|
191 |
-
model_path =
|
192 |
image_path = ${image_path}
|
193 |
|
194 |
# Input Text
|
|
|
1 |
---
|
2 |
license: llama2
|
3 |
---
|
4 |
+
# Chat-UniVi: Unified Visual Representation Empowers Large Language Models with Image and Video Understanding
|
5 |
+
|
6 |
+
**Paper or resources for more information:**
|
7 |
+
[[Paper](https://huggingface.co/papers/2311.08046)] [[Code](https://github.com/PKU-YuanGroup/Chat-UniVi)]
|
8 |
+
|
9 |
+
## License
|
10 |
+
Llama 2 is licensed under the LLAMA 2 Community License,
|
11 |
+
Copyright (c) Meta Platforms, Inc. All Rights Reserved.
|
12 |
+
|
13 |
## 😮 Highlights
|
14 |
|
15 |
### 💡 Unified visual representation for image and video
|
|
|
99 |
|
100 |
if __name__ == '__main__':
|
101 |
# Model Parameter
|
102 |
+
model_path = "Chat-UniVi/Chat-UniVi" # or "Chat-UniVi/Chat-UniVi-13B"
|
103 |
video_path = ${video_path}
|
104 |
max_frames = ${max_frames}
|
105 |
|
|
|
197 |
|
198 |
if __name__ == '__main__':
|
199 |
# Model Parameter
|
200 |
+
model_path = "Chat-UniVi/Chat-UniVi" # or "Chat-UniVi/Chat-UniVi-13B"
|
201 |
image_path = ${image_path}
|
202 |
|
203 |
# Input Text
|