Spaces:
Running on Zero
4-bit load.
Browse files
app.py
CHANGED
@@ -220,8 +220,8 @@ if __name__ == '__main__':
|
|
220 |
conv_mode = "llama_2"
|
221 |
model_path = 'DAMO-NLP-SG/VideoLLaMA2-7B'
|
222 |
|
223 |
-
handler = Chat(model_path, conv_mode=conv_mode, load_8bit=… [remainder of the removed line is truncated in the diff view]
|
224 |
-
handler.model.to(dtype=torch.float16)
|
225 |
|
226 |
if not os.path.exists("temp"):
|
227 |
os.makedirs("temp")
|
|
|
220 |
conv_mode = "llama_2"
|
221 |
model_path = 'DAMO-NLP-SG/VideoLLaMA2-7B'
|
222 |
|
223 |
+
handler = Chat(model_path, conv_mode=conv_mode, load_8bit=False, load_4bit=True, device='cuda')
|
224 |
+
# handler.model.to(dtype=torch.float16)
|
225 |
|
226 |
if not os.path.exists("temp"):
|
227 |
os.makedirs("temp")
|