Romain Cosentino committed on
Commit
81ce442
1 Parent(s): 5cfeb50

Update app.py

Browse files

Changing model loading from 4-bit quantization (load_in_4bit=True) to bfloat16 (torch_dtype=torch.bfloat16)

Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -29,7 +29,7 @@ if not torch.cuda.is_available():
29
 
30
  if torch.cuda.is_available():
31
  model_id = "tenyx/TenyxChat-7B-v1"
32
- model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto", load_in_4bit=True)
33
  tokenizer = AutoTokenizer.from_pretrained(model_id)
34
  tokenizer.use_default_system_prompt = False
35
 
 
29
 
30
  if torch.cuda.is_available():
31
  model_id = "tenyx/TenyxChat-7B-v1"
32
+ model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto", torch_dtype=torch.bfloat16)
33
  tokenizer = AutoTokenizer.from_pretrained(model_id)
34
  tokenizer.use_default_system_prompt = False
35