neural-mesh / test /run_single_problem.sh
hjkim00's picture
Upload TestTime-RLVR-v2 from Full-pipeline-relative_0827 branch
f50dc54 verified
#!/bin/bash
# Run combined TTRLVR + AZR training on one specific benchmark problem.
#
# Usage: run_single_problem.sh [GPU_ID] [PROBLEM_ID] [ROUNDS]
#   GPU_ID      value exported as CUDA_VISIBLE_DEVICES and passed as --gpu
#               (default: 5)
#   PROBLEM_ID  problem identifier passed as --problem-id (default: Mbpp/7)
#   ROUNDS      value passed as --rounds (default: 3)

# Default settings: each positional argument falls back to its default when
# it is missing or empty.
GPU_ID=${1:-5}
PROBLEM_ID=${2:-"Mbpp/7"}
ROUNDS=${3:-3}

# Environment variables exported to the training process.
export CUDA_VISIBLE_DEVICES="$GPU_ID"
export VLLM_ATTENTION_BACKEND=FLASH_ATTN
# NOTE(review): per the Ray docs a refresh interval of 0 disables the memory
# monitor -- confirm this is still intended.
export RAY_memory_monitor_refresh_ms=0
export RAY_LOGGING_LEVEL=DEBUG
export HYDRA_FULL_ERROR=1
# Append the project trees to PYTHONPATH. The ${VAR:+...} form only emits the
# existing value plus ':' when PYTHONPATH is already non-empty; a bare
# "${PYTHONPATH}:..." would start with ':' when it is unset, creating an empty
# path entry (which Python treats as the current working directory).
export PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}/home/ubuntu/RLVR/verl:/home/ubuntu/RLVR/TestTime-RLVR-v2"
# Log directory (created if it does not exist yet).
LOG_DIR="/home/ubuntu/RLVR/TestTime-RLVR-v2/logs"
mkdir -p -- "$LOG_DIR"
# Timestamp (YYYYmmdd_HHMMSS) that makes each run's log file name unique.
TIMESTAMP=$(date +%Y%m%d_%H%M%S)
# Problem IDs such as "Mbpp/7" contain '/', which cannot appear in a file
# name, so every '/' is replaced with '_'. Parameter expansion is used instead
# of `echo $PROBLEM_ID | tr` so the value is never word-split, glob-expanded,
# or misread as an echo option.
SAFE_PROBLEM_ID=${PROBLEM_ID//\//_}
LOG_FILE="$LOG_DIR/single_problem_${SAFE_PROBLEM_ID}_${TIMESTAMP}.log"
# Print the run banner: a title, then the problem ID, round count, GPU and
# log file path framed by two separator lines, followed by a blank line.
# One printf call emits each argument on its own line.
printf '%s\n' \
  "🎯 νŠΉμ • 문제 ν•™μŠ΅ μ‹œμž‘" \
  "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━" \
  "πŸ“Œ 문제 ID: $PROBLEM_ID" \
  "πŸ”„ λΌμš΄λ“œ 수: $ROUNDS" \
  "πŸ–₯️ GPU: $GPU_ID" \
  "πŸ“ 둜그 파일: $LOG_FILE" \
  "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━" \
  ""
# Run train_ttrlvr_azr.py for the selected problem. stdout and stderr are
# merged, shown on the terminal, and written to LOG_FILE through tee.
python /home/ubuntu/RLVR/TestTime-RLVR-v2/test/train_ttrlvr_azr.py \
  --benchmark mbpp \
  --problem-id "$PROBLEM_ID" \
  --rounds "$ROUNDS" \
  --gpu "$GPU_ID" \
  --model "Qwen/Qwen2.5-7B" \
  2>&1 | tee "$LOG_FILE"
# A pipeline's exit status is normally that of its last command (tee), which
# would hide a failed training run. PIPESTATUS[0] holds python's own status;
# it must be read immediately, before any other command overwrites it.
train_status=${PIPESTATUS[0]}
echo ""
if [[ "$train_status" -ne 0 ]]; then
  # Report the failure on stderr and propagate the trainer's exit code so
  # callers (schedulers, wrapper scripts) can detect it.
  echo "Training failed (exit code $train_status). See log: $LOG_FILE" >&2
  exit "$train_status"
fi
echo "βœ… ν•™μŠ΅ μ™„λ£Œ. 둜그 확인: $LOG_FILE"