Spaces: Running on Zero
Feature(MInference): add dtype
Browse files
app.py
CHANGED
@@ -57,7 +57,7 @@ h1 {
|
|
57 |
# Load the tokenizer and model
|
58 |
model_name = "gradientai/Llama-3-8B-Instruct-262k"
|
59 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
60 |
-
model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto") # to("cuda:0")
|
61 |
|
62 |
from minference import MInference
|
63 |
minference_patch = MInference("minference", model_name)
|
|
|
57 |
# Load the tokenizer and model
|
58 |
model_name = "gradientai/Llama-3-8B-Instruct-262k"
|
59 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
60 |
+
model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto") # to("cuda:0")
|
61 |
|
62 |
from minference import MInference
|
63 |
minference_patch = MInference("minference", model_name)
|