vilarin committed on
Commit
8716f81
1 Parent(s): 957cbfc

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -7
app.py CHANGED
@@ -16,13 +16,9 @@ MODEL_FILE = "gemma-2-27b-it-Q4_K_M.gguf"
16
 
17
  os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
18
 
19
- llm = Llama(
20
- model_path=hf_hub_download(
21
- repo_id=REPO_ID,
22
- filename=MODEL_FILE,
23
- ),
24
- n_ctx=4096,
25
- n_gpu_layers=-1,
26
  tokenizer=llama_cpp.llama_tokenizer.LlamaHFTokenizer.from_pretrained(MODEL_ID),
27
  verbose=False,
28
  )
 
16
 
17
  os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
18
 
19
+ llm = llama_cpp.Llama.from_pretrained(
20
+ repo_id=REPO_ID,
21
+ filename=MODEL_FILE,
 
 
 
 
22
  tokenizer=llama_cpp.llama_tokenizer.LlamaHFTokenizer.from_pretrained(MODEL_ID),
23
  verbose=False,
24
  )