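# Provenance (Hugging Face file-viewer header captured with this file):
#   author: m97j | commit: "Initial commit" (5fc69e4) | size: 930 Bytes
#   viewer links: raw / history / blame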
import os
# Base URL of the Hugging Face Spaces serving endpoint. The Space is public,
# so its address can be used directly; the HF_SERVE_URL environment variable
# overrides this default.
HF_SERVE_URL: str = os.environ.get(
    "HF_SERVE_URL", "https://m97j-PersonaChatEngine.hf.space"
)
# Request timeout, in seconds. Read from the HF_TIMEOUT environment variable
# (default "25") and converted to a float when the module is imported.
HF_TIMEOUT: float = float(os.environ.get("HF_TIMEOUT", "25"))
# RAG is always used: this is a fixed setting, not a toggle.
RAG_ENABLED: bool = True
# ์ƒ์„ฑ ํŒŒ๋ผ๋ฏธํ„ฐ ๊ธฐ๋ณธ๊ฐ’ (์š”์ฒญ๋งˆ๋‹ค override ๊ฐ€๋Šฅ)
GENERATION_CONFIG = {
"max_new_tokens": int(os.getenv("GEN_MAX_NEW_TOKENS", "220")),
"temperature": float(os.getenv("GEN_TEMPERATURE", "0.7")),
"top_p": float(os.getenv("GEN_TOP_P", "0.9")),
"repetition_penalty": float(os.getenv("GEN_REPETITION_PENALTY", "1.1")),
"do_sample": True
}
# Model info (can be extended later).
# Disabled: the definition below is commented out, so this module does not
# define MODEL_INFO. Uncomment it to expose the constant.
# MODEL_INFO = {
#     "base_model": "meta-llama/Meta-Llama-3-8B",
#     "adapter": "m97j/PersonaAdapter-v1",
#     "serve_mode": "hf_spaces",  # or "local", "api"
# }