long1111 committed on
Commit
037c45d
1 Parent(s): cbdd2e9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -1,6 +1,6 @@
1
  from transformers import AutoTokenizer, AutoModel
2
  tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)
3
- model = AutoModel.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True).half().cuda()
4
  response, history = model.chat(tokenizer, "你好", history=[])
5
  print(response)
6
  response, history = model.chat(tokenizer, "晚上睡不着应该怎么办", history=history)
 
1
  from transformers import AutoTokenizer, AutoModel
2
  tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)
3
+ model = AutoModel.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True).half().quantize(4).cuda()
4
  response, history = model.chat(tokenizer, "你好", history=[])
5
  print(response)
6
  response, history = model.chat(tokenizer, "晚上睡不着应该怎么办", history=history)