lrl-modelcloud
committed on
Commit
•
7895993
1
Parent(s):
315de09
Update README.md
Browse files
README.md
CHANGED
@@ -46,8 +46,8 @@ This model has been quantized using [GPTQModel](https://github.com/ModelCloud/GP
|
|
46 |
from transformers import AutoTokenizer
|
47 |
from gptqmodel import GPTQModel
|
48 |
|
49 |
-
tokenizer = AutoTokenizer.from_pretrained("ModelCloud/QwQ-32B-Preview-
|
50 |
-
model = GPTQModel.load("ModelCloud/QwQ-32B-Preview-
|
51 |
|
52 |
messages = [
|
53 |
{"role": "system", "content": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant."},
|
|
|
46 |
from transformers import AutoTokenizer
|
47 |
from gptqmodel import GPTQModel
|
48 |
|
49 |
+
tokenizer = AutoTokenizer.from_pretrained("ModelCloud/QwQ-32B-Preview-gptqmodel-4bit-vortex-v1")
|
50 |
+
model = GPTQModel.load("ModelCloud/QwQ-32B-Preview-gptqmodel-4bit-vortex-v1")
|
51 |
|
52 |
messages = [
|
53 |
{"role": "system", "content": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant."},
|