ccm's picture
Ok maybe lets not use nonthinking mode for agents
1a514b0
raw
history blame
413 Bytes
# Chat-UI talks to the local proxy (OpenAI-compatible base URL on localhost, port 8000).
# NOTE(review): this URL ends with a trailing slash while UPSTREAM_OPENAI_BASE below
# does not — confirm that both consumers join paths correctly.
OPENAI_BASE_URL=http://127.0.0.1:8000/v1/
# The proxy forwards requests here (your Hugging Face endpoint):
UPSTREAM_OPENAI_BASE=https://ay8ts6hfrqidjvwt.us-east-1.aws.endpoints.huggingface.cloud/v1
# Models used by the proxy.
# MODEL_NAME and AGENT_MODEL are set to the same model id; TASK_MODEL uses an id
# with a "-nothink" suffix.
# NOTE(review): presumably the "-nothink" id selects a non-thinking variant and is
# resolved by the proxy — confirm against the proxy code.
MODEL_NAME="Qwen/Qwen3-1.7B"
AGENT_MODEL="Qwen/Qwen3-1.7B"
TASK_MODEL="Qwen/Qwen3-1.7B-nothink"
# Application name (presumably the title displayed by Chat-UI — confirm).
PUBLIC_APP_NAME="Agent Examples"
# MongoDB connection string: a MongoDB instance on localhost, port 27017.
MONGODB_URL=mongodb://127.0.0.1:27017