Update app.py
Browse files
app.py
CHANGED
|
@@ -22,7 +22,7 @@ metadata = pickle.load(open("metadata.pkl", "rb"))
|
|
| 22 |
# Load Hugging Face LLM (CPU-friendly)
|
| 23 |
# -----------------------------
|
| 24 |
# Small model for HF Spaces CPU limits
|
| 25 |
-
model_name = "TheBloke/vicuna-
|
| 26 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 27 |
model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto") # Hugging Face will manage CPU/GPU
|
| 28 |
generator = pipeline("text-generation", model=model, tokenizer=tokenizer, max_length=200)
|
|
|
|
| 22 |
# Load Hugging Face LLM (CPU-friendly)
|
| 23 |
# -----------------------------
|
| 24 |
# Small model for HF Spaces CPU limits
|
| 25 |
+
model_name = "TheBloke/vicuna-3B-1.1-HF" # You can replace this with a smaller model if needed
|
| 26 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 27 |
model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto") # Hugging Face will manage CPU/GPU
|
| 28 |
generator = pipeline("text-generation", model=model, tokenizer=tokenizer, max_length=200)
|