iofu728 committed on
Commit
c67fd6f
1 Parent(s): 7b75ee1

Feature(MInference): add dtype

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -57,7 +57,7 @@ h1 {
57
  # Load the tokenizer and model
58
  model_name = "gradientai/Llama-3-8B-Instruct-262k"
59
  tokenizer = AutoTokenizer.from_pretrained(model_name)
60
- model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto") # to("cuda:0")
61
 
62
  from minference import MInference
63
  minference_patch = MInference("minference", model_name)
 
57
  # Load the tokenizer and model
58
  model_name = "gradientai/Llama-3-8B-Instruct-262k"
59
  tokenizer = AutoTokenizer.from_pretrained(model_name)
60
+ model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto") # to("cuda:0")
61
 
62
  from minference import MInference
63
  minference_patch = MInference("minference", model_name)