Spaces:
Runtime error
Runtime error
unsubscribe
committed on
Commit
•
3ee9c74
1
Parent(s):
ec64302
change model_repo_id
Browse files
app.py
CHANGED
@@ -5,7 +5,7 @@ from lmdeploy.serve.gradio.turbomind_coupled import *
|
|
5 |
from lmdeploy.messages import TurbomindEngineConfig
|
6 |
|
7 |
backend_config = TurbomindEngineConfig(max_batch_size=1, cache_max_entry_count=0.05, model_format='awq')
|
8 |
-
model_path = 'internlm/internlm2_5-7b-chat-
|
9 |
|
10 |
InterFace.async_engine = AsyncEngine(
|
11 |
model_path=model_path,
|
|
|
5 |
from lmdeploy.messages import TurbomindEngineConfig
|
6 |
|
7 |
backend_config = TurbomindEngineConfig(max_batch_size=1, cache_max_entry_count=0.05, model_format='awq')
|
8 |
+
model_path = 'internlm/internlm2_5-7b-chat-4bit'
|
9 |
|
10 |
InterFace.async_engine = AsyncEngine(
|
11 |
model_path=model_path,
|