Spaces:
Sleeping
Sleeping
🔧 환경 변수 설정 가이드
🏠 로컬 개발 환경
.env 파일 설정
프로젝트 루트에 .env 파일을 생성하고 다음 변수들을 설정하세요:
# 기본 서버 설정
HOST=0.0.0.0
PORT=8001
PYTHONPATH=/app
PYTHONUNBUFFERED=1
# 환경 감지
IS_LOCAL=true
ENVIRONMENT=local
DOCKER_ENV=local
# 모델 설정
DEFAULT_MODEL=kanana-1.5-v-3b-instruct
MAX_NEW_TOKENS=256
TEMPERATURE=0.7
# 로컬 모델 경로 (선택사항)
LOCAL_MODEL_PATH=./lily_llm_core/models/kanana_1_5_v_3b_instruct
로컬 Docker 실행
# 로컬 개발용 Docker 빌드
docker build -f Dockerfile.local -t lily-llm-local .
# 로컬 실행 (포트 8001)
docker run -p 8001:8001 --env-file .env lily-llm-local
☁️ Hugging Face Spaces 환경
필수 환경 변수
Hugging Face Spaces Settings > Variables에서 다음 변수들을 설정하세요:
기본 서버 설정
HOST=0.0.0.0
PORT=7860
PYTHONPATH=/app
PYTHONUNBUFFERED=1
Hugging Face 설정
# 캐시 디렉토리
TRANSFORMERS_CACHE=/app/cache/transformers
HF_HOME=/app/cache/huggingface
HF_HUB_CACHE=/app/cache/huggingface
# 모델 설정
HF_MODEL_NAME=gbrabbit/lily-math-model
DEFAULT_MODEL=kanana-1.5-v-3b-instruct
# 토큰화 병렬 처리 비활성화 (메모리 절약)
TOKENIZERS_PARALLELISM=false
성능 최적화
# CPU 스레드 제한 (메모리 절약)
OMP_NUM_THREADS=1
MKL_NUM_THREADS=1
# PyTorch 설정
TORCH_HOME=/app/cache/torch
PYTORCH_TRANSFORMERS_CACHE=/app/cache/transformers
AI 모델 설정
# 생성 파라미터
MAX_NEW_TOKENS=256
TEMPERATURE=0.7
TOP_P=0.9
TOP_K=40
선택적 환경 변수
디버깅
# 로그 레벨
LOG_LEVEL=INFO
DEBUG=false
# 상세 로깅
TRANSFORMERS_VERBOSITY=warning
HF_HUB_VERBOSITY=warning
보안 (필요시)
# API 키 (필요한 경우)
HF_TOKEN=your_huggingface_token
API_SECRET_KEY=your_secret_key
자동 모델 다운로드 동작 방식
1단계: 로컬 모델 확인
- /app/lily_llm_core/models/kanana_1_5_v_3b_instruct/ 경로 확인
- 파일이 있으면 로컬 모델 사용
2단계: Hugging Face Hub 다운로드
- 로컬 모델이 없으면 gbrabbit/lily-math-model에서 자동 다운로드
- /app/cache/transformers/ 경로에 캐시 저장
3단계: 모델 로딩
- 캐시된 모델을 메모리에 로드
- 서버 시작 완료
예상 동작
첫 번째 배포
Hugging Face Hub에서 다운로드: gbrabbit/lily-math-model
📥 모델 다운로드 중... (약 2-5분)
✅ 모델 로드 완료
서버 시작: 0.0.0.0:7860
이후 재시작
캐시된 모델 사용: /app/cache/transformers/
✅ 모델 로드 완료 (약 30초)
서버 시작: 0.0.0.0:7860
문제 해결
모델 다운로드 실패
# 네트워크 연결 확인
curl -I https://huggingface.co/gbrabbit/lily-math-model
# Hugging Face Hub 상태 확인
curl -I https://huggingface.co/api/models/gbrabbit/lily-math-model
메모리 부족
# 더 작은 모델 사용 또는 양자화 적용
# Hardware 업그레이드 고려 (CPU upgrade 또는 GPU)
캐시 문제
# 캐시 디렉토리 권한 확인
ls -la /app/cache/
# 캐시 삭제 후 재시작
rm -rf /app/cache/transformers/*