TI_RAG_Demo_L3.1

Runtime error

arjunanand13 committed on May 27, 2024

Commit

ba1cc0a

•

1 Parent(s): 7d15343

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -22,7 +22,8 @@ class StopOnTokens(StoppingCriteria):
 # Load the LLaMA model and tokenizer
 # model_id = 'meta-llama/Meta-Llama-3-8B-Instruct'
-model_id= "meta-llama/Llama-2-7b-chat-hf"
 device = f'cuda:{cuda.current_device()}' if cuda.is_available() else 'cpu'
 # Set quantization configuration

 # Load the LLaMA model and tokenizer
 # model_id = 'meta-llama/Meta-Llama-3-8B-Instruct'
+# model_id= "meta-llama/Llama-2-7b-chat-hf"
+model_id="mistralai/Mistral-7B-Instruct-v0.2"
 device = f'cuda:{cuda.current_device()}' if cuda.is_available() else 'cpu'
 # Set quantization configuration