CoderCowMoo committed on
Commit
125b498
•
1 Parent(s): 5e96c36

No device, and cuda in the spaces function?

Browse files
Files changed (1) hide show
  1. app.py +1 -2
app.py CHANGED
@@ -16,7 +16,6 @@ tokenizer = AutoTokenizer.from_pretrained(model_id)
16
  quantize_config = BaseQuantizeConfig(
17
  bits=4,
18
  group_size=128,
19
- device_map="auto",
20
  desc_act=False
21
  )
22
  model = AutoGPTQForCausalLM.from_quantized(
@@ -46,7 +45,7 @@ def respond(
46
 
47
  response = ""
48
 
49
- inputs = tokenizer.apply_chat_template(messages, return_tensors="pt")
50
  streamer = TextIteratorStreamer(tokenizer, skip_special_tokens=True, skip_prompt=True)
51
 
52
  thread = Thread(
 
16
  quantize_config = BaseQuantizeConfig(
17
  bits=4,
18
  group_size=128,
 
19
  desc_act=False
20
  )
21
  model = AutoGPTQForCausalLM.from_quantized(
 
45
 
46
  response = ""
47
 
48
+ inputs = tokenizer.apply_chat_template(messages, return_tensors="pt").to(device=torch.device("cuda"))
49
  streamer = TextIteratorStreamer(tokenizer, skip_special_tokens=True, skip_prompt=True)
50
 
51
  thread = Thread(