Spaces:
Sleeping
Sleeping
# Audit QA Configuration
# Converted from model_params.cfg to YAML format
# Qdrant connection settings.
qdrant:
  # Commented-out alternative URL:
  # url: "http://10.1.4.192:8803"
  url: "https://2c6d0136-b6ca-4400-bac5-1703f58abc43.europe-west3-0.gcp.cloud.qdrant.io"
  collection_name: "docling"
  prefer_grpc: true
  # NOTE(review): YAML does not expand "${...}" on its own; the code that
  # loads this file must substitute the environment variable - confirm.
  api_key: "${QDRANT_API_KEY}"  # Load from environment variable
# Retriever settings: model name, normalization flag, and result count.
retriever:
  model: "BAAI/bge-m3"
  normalize: true
  top_k: 20
# Retrieval pipeline settings: reranking toggle and reranker parameters.
# NOTE(review): reranker_model / reranker_top_k carry the same values as
# ranker.model / ranker.top_k elsewhere in this file; which pair the
# application actually reads is not visible here - confirm.
retrieval:
  use_reranking: true
  reranker_model: "BAAI/bge-reranker-v2-m3"
  reranker_top_k: 5
# Ranker settings: model name and result count.
ranker:
  model: "BAAI/bge-reranker-v2-m3"
  top_k: 5
# BM25 settings: result count.
bm25:
  top_k: 20
# Hybrid search defaults: search mode and vector-score weight.
hybrid:
  default_mode: "vector_only"  # Options: vector_only, sparse_only, hybrid
  default_alpha: 0.5  # Weight for vector scores (0.5 = equal weight)
# Reader settings: the default LLM provider plus per-provider configuration.
# NOTE(review): indentation was lost in extraction. The provider maps are
# nested under `reader` here because `default_type` matches one of the
# provider keys - confirm against the original file.
reader:
  default_type: "OPENAI"
  max_tokens: 768

  # Different LLM provider configurations
  INF_PROVIDERS:
    model: "meta-llama/Llama-3.1-8B-Instruct"
    provider: "nebius"

  # Not working
  NVIDIA:
    model: "meta-llama/Llama-3.1-8B-Instruct"
    endpoint: "https://huggingface.co/api/integrations/dgx/v1"

  # Not working
  DEDICATED:
    model: "meta-llama/Llama-3.1-8B-Instruct"
    endpoint: "https://qu2d8m6dmsollhly.us-east-1.aws.endpoints.huggingface.cloud"

  MISTRAL:
    model: "mistral-medium-latest"

  OPENAI:
    model: "gpt-4o-mini"

  OLLAMA:
    model: "mistral-small3.1:24b-instruct-2503-q8_0"
    # NOTE(review): 10.x.x.x is a private-network address, so this URL is
    # only reachable from inside that network.
    base_url: "http://10.1.4.192:11434/"
    temperature: 0.8
    num_predict: 256

  OPENROUTER:
    model: "moonshotai/kimi-k2:free"
    base_url: "https://openrouter.ai/api/v1"
    temperature: 0.7
    max_tokens: 1000
    # site_url: "https://your-site.com"  # optional, for OpenRouter ranking
    # site_name: "Your Site Name"  # optional, for OpenRouter ranking
# Application settings: default dropdown selection.
app:
  dropdown_default: "Annual Consolidated OAG 2024"
# File paths
paths:
  chunks_file: "reports/docling_chunks.json"
  reports_dir: "reports"
# Feature toggles
features:
  enable_session: true
  enable_logging: true
| # Logging and HuggingFace scheduler configuration. NOTE(review): indentation was lost when this file was extracted, so it is unclear whether `huggingface` nests under `logging` or is a separate top-level key - confirm against the original YAML before restoring the structure. | |
| logging: | |
| json_dataset_dir: "json_dataset" | |
| huggingface: | |
| repo_id: "GIZ/spaces_logs" | |
| repo_type: "dataset" | |
| folder_path: "json_dataset" | |
| path_in_repo: "audit_chatbot" | |
| token_env_var: "SPACES_LOG" | |