Quentin Fisch committed on
Commit
5327a62
1 Parent(s): efb5688

feat(model): try mixtral-8x22b-instruct-v0.1

Browse files
Files changed (1) hide show
  1. confluence_rag.py +5 -2
confluence_rag.py CHANGED
@@ -87,7 +87,8 @@ def store_vector(all_splits: List[str]) -> VectorStoreRetriever:
87
 
88
  # Use the HuggingFace distilbert-base-uncased model to embed the text
89
  embeddings_model_url = (
90
- "https://api-inference.huggingface.co/models/distilbert-base-uncased"
 
91
  )
92
 
93
  embeddings = HuggingFaceInferenceAPIEmbeddings(
@@ -138,13 +139,15 @@ def generate_rag_chain(retriever: VectorStoreRetriever = None) -> RunnableSequen
138
  """
139
  # Use the Mistral Free prototype API
140
  mistral_url = (
141
- "https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.2"
 
142
  )
143
 
144
  model_endpoint = HuggingFaceEndpoint(
145
  endpoint_url=mistral_url,
146
  huggingfacehub_api_token=HF_API_KEY,
147
  task="text2text-generation",
 
148
  )
149
 
150
  # Use a custom output parser
 
87
 
88
  # Use the HuggingFace distilbert-base-uncased model to embed the text
89
  embeddings_model_url = (
90
+ # "https://api-inference.huggingface.co/models/distilbert-base-uncased"
91
+ "https://api-inference.huggingface.co/models/Salesforce/SFR-Embedding-Mistral"
92
  )
93
 
94
  embeddings = HuggingFaceInferenceAPIEmbeddings(
 
139
  """
140
  # Use the Mistral Free prototype API
141
  mistral_url = (
142
+ # "https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.2"
143
+ "https://api-inference.huggingface.co/models/mistralai/Mixtral-8x22B-Instruct-v0.1"
144
  )
145
 
146
  model_endpoint = HuggingFaceEndpoint(
147
  endpoint_url=mistral_url,
148
  huggingfacehub_api_token=HF_API_KEY,
149
  task="text2text-generation",
150
+ max_new_tokens=1024
151
  )
152
 
153
  # Use a custom output parser