Spaces:
Paused
Paused
Upload main.py
Browse files
updated backend to 13b
main.py
CHANGED
@@ -19,8 +19,11 @@ app = FastAPI(docs_url="/")
|
|
19 |
|
20 |
# pipe = pipeline(model="TheBloke/Llama-2-7B-GGML/llama-2-7b.ggmlv3.q4_0.bin")
|
21 |
|
22 |
-
model_name_or_path = "TheBloke/Llama-2-7B-GGUF"
|
23 |
-
model_basename = "llama-2-7b.Q4_0.gguf"
|
|
|
|
|
|
|
24 |
|
25 |
model_path = hf_hub_download(repo_id=model_name_or_path, filename=model_basename)
|
26 |
|
|
|
19 |
|
20 |
# pipe = pipeline(model="TheBloke/Llama-2-7B-GGML/llama-2-7b.ggmlv3.q4_0.bin")
|
21 |
|
22 |
+
# model_name_or_path = "TheBloke/Llama-2-7B-GGUF"
|
23 |
+
# model_basename = "llama-2-7b.Q4_0.gguf"
|
24 |
+
|
25 |
+
model_name_or_path = "Llama-2-13B-GGUF"
|
26 |
+
model_basename = "llama-2-13b.Q3_K_S.gguf"
|
27 |
|
28 |
model_path = hf_hub_download(repo_id=model_name_or_path, filename=model_basename)
|
29 |
|