clemparpa committed on
Commit
73d33c9
1 Parent(s): f65697c

Removed the .to("cuda") call when loading the model in 4-bit

Browse files
Files changed (1) hide show
  1. handler.py +3 -2
handler.py CHANGED
@@ -27,9 +27,10 @@ class EndpointHandler():
27
  self.model = AutoModelForCausalLM.from_pretrained(
28
  path,
29
  temperature=0,
30
- torch_dtype = self.dtype,
31
  load_in_4bit = self.load_in_4bit,
32
- ).to("cuda")
 
33
 
34
  self.tokenizer = AutoTokenizer.from_pretrained(path)
35
  self.tokenizer.padding_side="left"
 
27
  self.model = AutoModelForCausalLM.from_pretrained(
28
  path,
29
  temperature=0,
30
+ # torch_dtype = self.dtype,
31
  load_in_4bit = self.load_in_4bit,
32
+ )
33
+ # .to("cuda")
34
 
35
  self.tokenizer = AutoTokenizer.from_pretrained(path)
36
  self.tokenizer.padding_side="left"