shideqin committed on
Commit
617bcb0
1 Parent(s): c63d66d

add use-cpu

Browse files
Files changed (1) hide show
  1. app.py +5 -1
app.py CHANGED
@@ -1,8 +1,12 @@
1
  from transformers import AutoModel, AutoTokenizer
2
  import gradio as gr
3
 
 
4
  tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)
5
- model = AutoModel.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True).half().cuda()
 
 
 
6
  model = model.eval()
7
 
8
  def predict(input, history=None):
 
1
  from transformers import AutoModel, AutoTokenizer
2
  import gradio as gr
3
 
4
+ use_cpu = os.environ.get("USE_CPU", "all")
5
  tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)
6
+ if not use_cpu:
7
+ model = AutoModel.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True).half().cuda()
8
+ else:
9
+ model = AutoModel.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True).float()
10
  model = model.eval()
11
 
12
  def predict(input, history=None):