minhdang committed on
Commit
659b257
1 Parent(s): ca96c4f

Update inference.py

Browse files
Files changed (1) hide show
  1. inference.py +0 -1
inference.py CHANGED
@@ -37,7 +37,6 @@ from transformers import BitsAndBytesConfig
37
 
38
  nf8_config = BitsAndBytesConfig(
39
  load_in_8bit=True,
40
- bnb_8bit_use_double_quant=True,
41
  bnb_8bit_quant_type="nf8",
42
  )
43
  def load_model(model_path):
 
37
 
38
  nf8_config = BitsAndBytesConfig(
39
  load_in_8bit=True,
 
40
  bnb_8bit_quant_type="nf8",
41
  )
42
  def load_model(model_path):