More_Advanced_Embeddings_Comparator

Running

Chris4K committed on Oct 22, 2024

Commit

9684173

verified ·

1 Parent(s): 12758a0

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -807,6 +807,21 @@ def get_llm_suggested_settings(file, num_chunks=1):
 9. Whether to optimize vocabulary
 10. Whether to apply phonetic matching
 Text chunks:
 {' '.join(sample_chunks)}

 9. Whether to optimize vocabulary
 10. Whether to apply phonetic matching
+Expected output format:
+{{
+    "embedding_models": "embedding_model_type:embedding_model_name",
+    "split_strategy": "token or recursive",
+    "chunk_size": 250,
+    "overlap_size": 50,
+    "vector_store_type": "FAISS or Chroma",
+    "search_type": "similarity, mmr, or custom",
+    "top_k": 5,
+    "apply_preprocessing": True,
+    "optimize_vocab": True,
+    "apply_phonetic": False,
+    "phonetic_weight": 0.3  # Default value, as it's not in the LLM suggestions
+}}
 Text chunks:
 {' '.join(sample_chunks)}