lily_fast_api / deploy_gpu_huggingface.sh
gbrabbit's picture
Fresh start for HF Spaces deployment
526927a
raw
history blame
2.56 kB
#!/bin/bash
# Hugging Face GPU deployment script.
#
# Usage: run from the directory that contains docker-compose.gpu.yml and the
# helper Python scripts invoked below (every path is relative to the current
# working directory).
#
# Steps: verify the GPU environment, run the Hugging Face setup script, tear
# down the previous compose stack, rebuild the images, start the containers,
# wait for the API health endpoint, then run the deployment test and the
# performance-optimization script.
#
# Exit status: 0 on success; 1 as soon as a required step fails. Cleanup and
# diagnostic commands (compose down, GPU reset, nvidia-smi report) are
# best-effort and only produce a warning on stderr.

set -euo pipefail

readonly COMPOSE_FILE="docker-compose.gpu.yml"
readonly API_BASE_URL="http://localhost:8001"
readonly HEALTH_URL="${API_BASE_URL}/health"
readonly STARTUP_GRACE=15        # seconds to wait before the first probe
readonly HEALTH_MAX_ATTEMPTS=30  # number of health probes before giving up
readonly HEALTH_RETRY_DELAY=2    # seconds between failed probes
readonly HEALTH_PROBE_TIMEOUT=5  # seconds before a single probe is abandoned

# Print a message on stderr and abort the script with status 1.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Print a non-fatal warning on stderr.
warn() {
  printf '%s\n' "$*" >&2
}

# Run docker-compose against the GPU compose file.
# Arguments: the docker-compose sub-command and its options.
compose() {
  docker-compose -f "${COMPOSE_FILE}" "$@"
}

# Run a required command and abort with the given message if it fails.
# Arguments: $1 - failure message; remaining arguments - command to run.
require_step() {
  local failure_message=$1
  shift
  if ! "$@"; then
    die "${failure_message}"
  fi
}

# Poll the API health endpoint until it answers successfully.
# Returns: 0 once a probe succeeds, 1 after HEALTH_MAX_ATTEMPTS failures.
wait_for_health() {
  local attempt
  for ((attempt = 1; attempt <= HEALTH_MAX_ATTEMPTS; attempt++)); do
    # --max-time keeps a hung connection from stalling the whole loop.
    if curl -f --max-time "${HEALTH_PROBE_TIMEOUT}" "${HEALTH_URL}" \
      &>/dev/null; then
      echo "✅ Lily LLM API 서비스 정상"
      return 0
    fi
    # No waiting message or sleep after the final failed probe.
    if ((attempt < HEALTH_MAX_ATTEMPTS)); then
      echo "⏳ 서비스 시작 대기 중... (${attempt}/${HEALTH_MAX_ATTEMPTS})"
      sleep "${HEALTH_RETRY_DELAY}"
    fi
  done
  return 1
}

# Print the post-deployment summary: service URLs and handy commands.
print_service_info() {
  cat <<EOF

🎉 Hugging Face GPU 환경 배포 완료!

📋 서비스 정보:
 - Lily LLM API: ${API_BASE_URL}
 - Hearth Chat: http://localhost:8000
 - LaTeX-OCR Service: 별도 컨테이너로 실행 중

🔧 유용한 명령어:
 - 로그 확인: docker-compose -f ${COMPOSE_FILE} logs -f
 - 서비스 중지: docker-compose -f ${COMPOSE_FILE} down
 - 서비스 재시작: docker-compose -f ${COMPOSE_FILE} restart

🧪 테스트 명령어:
 - API 테스트: curl ${HEALTH_URL}
 - GPU 테스트: python test_gpu_deployment.py
 - Hugging Face 테스트: python huggingface_gpu_setup.py

💡 Hugging Face 모델 사용:
 - 모델 로드: python huggingface_gpu_setup.py
 - 토큰 설정: huggingface-cli login
EOF
}

main() {
  echo "🚀 Hugging Face GPU 환경 배포 시작"

  # Check the GPU environment.
  echo "🔍 GPU 환경 확인 중..."
  require_step "❌ GPU 환경 확인 실패" python check_gpu_environment.py

  # Hugging Face setup.
  echo "🔧 Hugging Face 환경 설정 중..."
  require_step "❌ Hugging Face 환경 설정 실패" python huggingface_gpu_setup.py

  # Remove the previous containers. --volumes also deletes the volumes that
  # belong to the stack, so every deployment starts from a clean state.
  echo "🧹 기존 컨테이너 정리 중..."
  compose down --volumes --remove-orphans \
    || warn "⚠️ 기존 컨테이너 정리 실패 (계속 진행)"

  # Free GPU memory. Best-effort: the failure is reported but not fatal.
  # NOTE(review): a GPU reset normally needs root and an idle GPU — confirm
  # this step is expected to succeed on the target hosts.
  echo "💾 GPU 메모리 정리 중..."
  nvidia-smi --gpu-reset || warn "⚠️ GPU 리셋 실패 (계속 진행)"

  # Build the images.
  echo "🔨 Docker 이미지 빌드 중..."
  require_step "❌ Docker 이미지 빌드 실패" compose build --no-cache

  # Start the containers.
  echo "🚀 컨테이너 시작 중..."
  require_step "❌ 컨테이너 시작 실패" compose up -d

  # Give the services a moment to boot before probing them.
  echo "📊 서비스 상태 확인 중..."
  sleep "${STARTUP_GRACE}"

  # Health check; dump the container logs if the API never comes up.
  echo "🏥 헬스체크 중..."
  if ! wait_for_health; then
    warn "❌ 서비스 시작 실패"
    compose logs || true
    exit 1
  fi

  # Report GPU usage (diagnostic only).
  echo "🎮 GPU 사용량 확인:"
  nvidia-smi || warn "⚠️ GPU 사용량 확인 실패 (계속 진행)"

  # Test the Hugging Face model.
  echo "🧪 Hugging Face 모델 테스트 중..."
  require_step "❌ Hugging Face 모델 테스트 실패" python test_gpu_deployment.py

  # Apply the performance optimizations.
  echo "⚡ 성능 최적화 적용 중..."
  require_step "❌ 성능 최적화 적용 실패" python performance_optimization.py

  # Print the service information.
  print_service_info
}

main "$@"