#!/bin/bash
#
# Run train_ttrlvr_azr.py on a single MBPP problem and tee its combined
# stdout/stderr into a timestamped log file.
#
# Usage: <this-script> [GPU_ID] [PROBLEM_ID] [ROUNDS]
#   GPU_ID      exported as CUDA_VISIBLE_DEVICES and passed to --gpu (default: 5)
#   PROBLEM_ID  passed to --problem-id                               (default: Mbpp/7)
#   ROUNDS      passed to --rounds                                   (default: 3)
#
# Exit status: the exit status of the Python trainer (not of tee), or 1 if the
# log directory cannot be created.

# ---- Positional arguments (all optional) -----------------------------------
GPU_ID=${1:-5}
PROBLEM_ID=${2:-"Mbpp/7"}
ROUNDS=${3:-3}

# ---- Environment for the trainer -------------------------------------------
PROJECT_ROOT="/home/ubuntu/RLVR/TestTime-RLVR-v2"

export CUDA_VISIBLE_DEVICES=$GPU_ID
export VLLM_ATTENTION_BACKEND=FLASH_ATTN
# NOTE(review): per Ray's documentation a refresh interval of 0 disables the
# memory monitor — confirm for the Ray version in use.
export RAY_memory_monitor_refresh_ms=0
export RAY_LOGGING_LEVEL=DEBUG
export HYDRA_FULL_ERROR=1
export PYTHONPATH="${PYTHONPATH}:/home/ubuntu/RLVR/verl:${PROJECT_ROOT}"

# ---- Log file location -----------------------------------------------------
LOG_DIR="${PROJECT_ROOT}/logs"
if ! mkdir -p -- "$LOG_DIR"; then
  echo "error: cannot create log directory: $LOG_DIR" >&2
  exit 1
fi

TIMESTAMP=$(date +%Y%m%d_%H%M%S)
# Problem ids contain '/' (e.g. "Mbpp/7"); replace every '/' with '_' so the id
# can be embedded in a file name.
SAFE_PROBLEM_ID=${PROBLEM_ID//\//_}
LOG_FILE="$LOG_DIR/single_problem_${SAFE_PROBLEM_ID}_${TIMESTAMP}.log"

# ---- Banner ----------------------------------------------------------------
# NOTE(review): the banner text below looks mis-encoded (probably UTF-8 text
# that was decoded with the wrong charset). It is reproduced unchanged here;
# restore the intended text from the original file if it is available.
echo "π― νΉμ  λ¬Έμ  νμ΅ μμ"
echo "ββββββββββββββββββββββββββββββββββββββββ"
echo "π λ¬Έμ  ID: $PROBLEM_ID"
echo "π λΌμ΄λ μ: $ROUNDS"
echo "π₯οΈ GPU: $GPU_ID"
echo "π λ‘κ·Έ νμΌ: $LOG_FILE"
echo "ββββββββββββββββββββββββββββββββββββββββ"
echo ""

# ---- Training run ----------------------------------------------------------
# stderr is merged into stdout so that both end up on the terminal and in the
# log file.
python "${PROJECT_ROOT}/test/train_ttrlvr_azr.py" \
  --benchmark mbpp \
  --problem-id "$PROBLEM_ID" \
  --rounds "$ROUNDS" \
  --gpu "$GPU_ID" \
  --model "Qwen/Qwen2.5-7B" \
  2>&1 | tee "$LOG_FILE"
# Must be read immediately after the pipeline: element 0 is the trainer's exit
# status, which the pipeline's own status (tee's) would otherwise hide.
train_status=${PIPESTATUS[0]}

# ---- Footer ----------------------------------------------------------------
echo ""
# The string literal spans two lines exactly as in the original (see the
# encoding note above the banner).
echo "β
νμ΅ μλ£. λ‘κ·Έ νμΈ: $LOG_FILE"

if [[ "$train_status" -ne 0 ]]; then
  echo "error: trainer exited with status $train_status" >&2
fi
exit "$train_status"