themissingCRAM
committed on
Commit
·
44a16d6
1
Parent(s):
8cfe61b
unsloth bnb 4bits
Browse files
app.py
CHANGED
|
@@ -161,7 +161,7 @@ if __name__ == "__main__":
|
|
| 161 |
model = TransformersModel(
|
| 162 |
# model_id="Qwen/Qwen2.5-Coder-14B-Instruct",
|
| 163 |
# model_id="unsloth/Llama-3.2-3B-Instruct-unsloth-bnb-4bit",
|
| 164 |
-
model_id = "
|
| 165 |
device_map="cuda"
|
| 166 |
)
|
| 167 |
# model = HfApiModel(
|
|
|
|
| 161 |
model = TransformersModel(
|
| 162 |
# model_id="Qwen/Qwen2.5-Coder-14B-Instruct",
|
| 163 |
# model_id="unsloth/Llama-3.2-3B-Instruct-unsloth-bnb-4bit",
|
| 164 |
+
model_id = "neuralmagic/Llama-3.2-3B-Instruct-FP8",
|
| 165 |
device_map="cuda"
|
| 166 |
)
|
| 167 |
# model = HfApiModel(
|