rivapereira123 committed on
Commit
0f5217f
·
verified ·
1 Parent(s): 0c2c20e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -564,11 +564,11 @@ class EnhancedGazaRAGSystem:
564
  # Enhanced quantization configuration
565
  quantization_config = BitsAndBytesConfig(
566
  load_in_4bit=True,
567
- bnb_4bit_compute_dtype=torch.float16,
568
  bnb_4bit_use_double_quant=True,
569
  bnb_4bit_quant_type="nf4",
570
- bnb_4bit_quant_storage=torch.uint8
571
  )
 
572
 
573
  self.tokenizer = AutoTokenizer.from_pretrained(
574
  model_name,
 
564
  # Enhanced quantization configuration
565
  quantization_config = BitsAndBytesConfig(
566
  load_in_4bit=True,
 
567
  bnb_4bit_use_double_quant=True,
568
  bnb_4bit_quant_type="nf4",
569
+ bnb_4bit_compute_dtype=torch.float16,
570
  )
571
+
572
 
573
  self.tokenizer = AutoTokenizer.from_pretrained(
574
  model_name,