# File: audit_assistant/src/config/settings.yaml
# Revision: 92633a7 - "Pilot (#2)" (akryldigital), 2.2 kB
# Audit QA Configuration
# Converted from model_params.cfg to YAML format
# Connection settings for the Qdrant vector store.
qdrant:
  # Alternative endpoint, currently disabled:
  # url: "http://10.1.4.192:8803"
  url: "https://2c6d0136-b6ca-4400-bac5-1703f58abc43.europe-west3-0.gcp.cloud.qdrant.io"
  collection_name: "docling"
  prefer_grpc: true
  # NOTE(review): YAML does not expand ${...} by itself; this assumes the
  # config loader substitutes the environment variable - confirm.
  api_key: "${QDRANT_API_KEY}"  # Load from environment variable
# Retriever settings: model identifier, normalization flag, and number of
# results to fetch.
retriever:
  model: "BAAI/bge-m3"
  normalize: true
  top_k: 20
# Reranking options for retrieval.
retrieval:
  use_reranking: true
  # NOTE(review): the same model id also appears in the `ranker` section;
  # confirm which of the two the code actually reads.
  reranker_model: "BAAI/bge-reranker-v2-m3"
  reranker_top_k: 5
# Ranker settings: model identifier and number of results to keep.
ranker:
  model: "BAAI/bge-reranker-v2-m3"
  top_k: 5
# BM25 settings: number of results to fetch.
bm25:
  top_k: 20
# Hybrid search defaults.
hybrid:
  default_mode: "vector_only"  # Options: vector_only, sparse_only, hybrid
  default_alpha: 0.5  # Weight for vector scores (0.5 = equal weight)
# Reader (LLM) settings. `default_type` names one of the provider sections
# below.
# NOTE(review): the provider sections are assumed to be nested under
# `reader`; the original indentation was lost - confirm against the loader.
reader:
  default_type: "OPENAI"
  max_tokens: 768

  # Different LLM provider configurations
  INF_PROVIDERS:
    model: "meta-llama/Llama-3.1-8B-Instruct"
    provider: "nebius"

  # Not working
  NVIDIA:
    model: "meta-llama/Llama-3.1-8B-Instruct"
    endpoint: "https://huggingface.co/api/integrations/dgx/v1"

  # Not working
  DEDICATED:
    model: "meta-llama/Llama-3.1-8B-Instruct"
    endpoint: "https://qu2d8m6dmsollhly.us-east-1.aws.endpoints.huggingface.cloud"

  MISTRAL:
    model: "mistral-medium-latest"

  OPENAI:
    model: "gpt-4o-mini"

  OLLAMA:
    model: "mistral-small3.1:24b-instruct-2503-q8_0"
    base_url: "http://10.1.4.192:11434/"
    temperature: 0.8
    num_predict: 256

  OPENROUTER:
    model: "moonshotai/kimi-k2:free"
    base_url: "https://openrouter.ai/api/v1"
    temperature: 0.7
    max_tokens: 1000
    # site_url: "https://your-site.com"  # optional, for OpenRouter ranking
    # site_name: "Your Site Name"  # optional, for OpenRouter ranking
# Application UI settings: default dropdown selection.
app:
  dropdown_default: "Annual Consolidated OAG 2024"
# File paths
# NOTE(review): paths are relative; the base directory they resolve against
# is not visible here - confirm.
paths:
  chunks_file: "reports/docling_chunks.json"
  reports_dir: "reports"
# Feature toggles
features:
  enable_session: true
  enable_logging: true
# Logging and HuggingFace scheduler configuration
logging:
  json_dataset_dir: "json_dataset"
  # NOTE(review): `huggingface` is assumed to be nested under `logging`;
  # the original indentation was lost - confirm against the loader.
  huggingface:
    repo_id: "GIZ/spaces_logs"
    repo_type: "dataset"
    folder_path: "json_dataset"
    path_in_repo: "audit_chatbot"
    # Name of an environment variable; presumably it holds the access
    # token - verify.
    token_env_var: "SPACES_LOG"