arjunanand13 committed on
Commit
ba1cc0a
1 Parent(s): 7d15343

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -22,7 +22,8 @@ class StopOnTokens(StoppingCriteria):
22
 
23
  # Load the LLaMA model and tokenizer
24
  # model_id = 'meta-llama/Meta-Llama-3-8B-Instruct'
25
- model_id= "meta-llama/Llama-2-7b-chat-hf"
 
26
  device = f'cuda:{cuda.current_device()}' if cuda.is_available() else 'cpu'
27
 
28
  # Set quantization configuration
 
22
 
23
  # Load the LLaMA model and tokenizer
24
  # model_id = 'meta-llama/Meta-Llama-3-8B-Instruct'
25
+ # model_id= "meta-llama/Llama-2-7b-chat-hf"
26
+ model_id="mistralai/Mistral-7B-Instruct-v0.2"
27
  device = f'cuda:{cuda.current_device()}' if cuda.is_available() else 'cpu'
28
 
29
  # Set quantization configuration