themissingCRAM
committed on
Commit
·
8cfe61b
1
Parent(s):
69286ea
unsloth bnb 4bits
Browse files
app.py
CHANGED
|
@@ -160,10 +160,10 @@ if __name__ == "__main__":
|
|
| 160 |
# you can use HFApiModel from smolagents if you don't mind paying more money.
|
| 161 |
model = TransformersModel(
|
| 162 |
# model_id="Qwen/Qwen2.5-Coder-14B-Instruct",
|
| 163 |
-
model_id="unsloth/Llama-3.2-3B-Instruct-unsloth-bnb-4bit",
|
|
|
|
| 164 |
device_map="cuda"
|
| 165 |
)
|
| 166 |
-
model.model.to("cuda")
|
| 167 |
# model = HfApiModel(
|
| 168 |
# model_id="meta-llama/Meta-Llama-3.1-8B-Instruct",
|
| 169 |
# token = os.getenv("bakery_multi_agents_hf_tokens_write")
|
|
|
|
| 160 |
# you can use HFApiModel from smolagents if you don't mind paying more money.
|
| 161 |
model = TransformersModel(
|
| 162 |
# model_id="Qwen/Qwen2.5-Coder-14B-Instruct",
|
| 163 |
+
# model_id="unsloth/Llama-3.2-3B-Instruct-unsloth-bnb-4bit",
|
| 164 |
+
model_id = "MaziyarPanahi/Llama-3.2-3B-Instruct-GGUF",
|
| 165 |
device_map="cuda"
|
| 166 |
)
|
|
|
|
| 167 |
# model = HfApiModel(
|
| 168 |
# model_id="meta-llama/Meta-Llama-3.1-8B-Instruct",
|
| 169 |
# token = os.getenv("bakery_multi_agents_hf_tokens_write")
|