sithumonline committed on
Commit
6b33574
1 Parent(s): eb0271e

Change model to phi-3

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -7,8 +7,8 @@ from huggingface_hub import hf_hub_download
7
 
8
  llm = Llama(
9
  model_path=hf_hub_download(
10
- repo_id=os.environ.get("REPO_ID", "TheBloke/Llama-2-7b-Chat-GGUF"),
11
- filename=os.environ.get("MODEL_FILE", "llama-2-7b-chat.Q5_0.gguf"),
12
  ),
13
  n_ctx=2048,
14
  n_gpu_layers=50, # change n_gpu_layers if you have more or less VRAM
@@ -82,3 +82,4 @@ demo = gr.ChatInterface(
82
 
83
  if __name__ == "__main__":
84
  demo.launch()
 
 
7
 
8
  llm = Llama(
9
  model_path=hf_hub_download(
10
+ repo_id=os.environ.get("REPO_ID", "microsoft/Phi-3-mini-4k-instruct-gguf"),
11
+ filename=os.environ.get("MODEL_FILE", "Phi-3-mini-4k-instruct-q4.gguf"),
12
  ),
13
  n_ctx=2048,
14
  n_gpu_layers=50, # change n_gpu_layers if you have more or less VRAM
 
82
 
83
  if __name__ == "__main__":
84
  demo.launch()
85
+