Update README.md
Browse files
README.md
CHANGED
@@ -55,9 +55,9 @@ output:你好!作为一个大型语言模型,我一直在学习和提高
|
|
55 |
```
|
56 |
|
57 |
|
58 |
-
##
|
59 |
-
```
|
60 |
-
llama2-chat-template.jinja file is chat-template above
|
61 |
model_path=Mistral-7B-Instruct-V0.4
|
62 |
python -m vllm.entrypoints.openai.api_server --model=$model_path \
|
63 |
--trust-remote-code --host 0.0.0.0 --port 7777 \
|
@@ -65,8 +65,8 @@ python -m vllm.entrypoints.openai.api_server --model=$model_path \
|
|
65 |
--max-model-len 8192 --chat-template llama2-chat-template.jinja \
|
66 |
--tensor-parallel-size 1 --served-model-name chatbot
|
67 |
```
|
68 |
-
```
|
69 |
|
|
|
70 |
from openai import OpenAI
|
71 |
# Set OpenAI's API key and API base to use vLLM's API server.
|
72 |
openai_api_key = "EMPTY"
|
|
|
55 |
```
|
56 |
|
57 |
|
58 |
+
## vLLM server
|
59 |
+
```shell
|
60 |
+
# llama2-chat-template.jinja is the chat template shown above
|
61 |
model_path=Mistral-7B-Instruct-V0.4
|
62 |
python -m vllm.entrypoints.openai.api_server --model=$model_path \
|
63 |
--trust-remote-code --host 0.0.0.0 --port 7777 \
|
|
|
65 |
--max-model-len 8192 --chat-template llama2-chat-template.jinja \
|
66 |
--tensor-parallel-size 1 --served-model-name chatbot
|
67 |
```
|
|
|
68 |
|
69 |
+
```python
|
70 |
from openai import OpenAI
|
71 |
# Set OpenAI's API key and API base to use vLLM's API server.
|
72 |
openai_api_key = "EMPTY"
|