Spaces:
Running on Zero
Running on Zero
Upload app.py
Browse files
app.py
CHANGED
|
@@ -87,7 +87,6 @@ def start_vllm_service() -> bool:
|
|
| 87 |
VLLM_PROCESS = subprocess.Popen(
|
| 88 |
[
|
| 89 |
"vllm", "serve", VLLM_MODEL_NAME,
|
| 90 |
-
"--port", str(VLLM_PORT),
|
| 91 |
"--host", VLLM_HOST,
|
| 92 |
"--tensor-parallel-size", "1",
|
| 93 |
"--gpu-memory-utilization", "0.95"
|
|
|
|
| 87 |
VLLM_PROCESS = subprocess.Popen(
|
| 88 |
[
|
| 89 |
"vllm", "serve", VLLM_MODEL_NAME,
|
|
|
|
| 90 |
"--host", VLLM_HOST,
|
| 91 |
"--tensor-parallel-size", "1",
|
| 92 |
"--gpu-memory-utilization", "0.95"
|