Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -564,11 +564,11 @@ class EnhancedGazaRAGSystem:
|
|
| 564 |
# Enhanced quantization configuration
|
| 565 |
quantization_config = BitsAndBytesConfig(
|
| 566 |
load_in_4bit=True,
|
| 567 |
-
bnb_4bit_compute_dtype=torch.float16,
|
| 568 |
bnb_4bit_use_double_quant=True,
|
| 569 |
bnb_4bit_quant_type="nf4",
|
| 570 |
-
|
| 571 |
)
|
|
|
|
| 572 |
|
| 573 |
self.tokenizer = AutoTokenizer.from_pretrained(
|
| 574 |
model_name,
|
|
|
|
| 564 |
# Enhanced quantization configuration
|
| 565 |
quantization_config = BitsAndBytesConfig(
|
| 566 |
load_in_4bit=True,
|
|
|
|
| 567 |
bnb_4bit_use_double_quant=True,
|
| 568 |
bnb_4bit_quant_type="nf4",
|
| 569 |
+
bnb_4bit_compute_dtype=torch.float16,
|
| 570 |
)
|
| 571 |
+
|
| 572 |
|
| 573 |
self.tokenizer = AutoTokenizer.from_pretrained(
|
| 574 |
model_name,
|