Removed the `.to("cuda")` call when loading the model in 4-bit
Browse files- handler.py +3 -2
handler.py
CHANGED
@@ -27,9 +27,10 @@ class EndpointHandler():
|
|
27 |
self.model = AutoModelForCausalLM.from_pretrained(
|
28 |
path,
|
29 |
temperature=0,
|
30 |
-
torch_dtype = self.dtype,
|
31 |
load_in_4bit = self.load_in_4bit,
|
32 |
-
)
|
|
|
33 |
|
34 |
self.tokenizer = AutoTokenizer.from_pretrained(path)
|
35 |
self.tokenizer.padding_side="left"
|
|
|
27 |
self.model = AutoModelForCausalLM.from_pretrained(
|
28 |
path,
|
29 |
temperature=0,
|
30 |
+
# torch_dtype = self.dtype,
|
31 |
load_in_4bit = self.load_in_4bit,
|
32 |
+
)
|
33 |
+
# .to("cuda")
|
34 |
|
35 |
self.tokenizer = AutoTokenizer.from_pretrained(path)
|
36 |
self.tokenizer.padding_side="left"
|