#!/usr/bin/env bash
#
# Run TTRLVR + AZR integrated training on a single benchmark problem.
#
# Usage: <this-script> [GPU_ID] [PROBLEM_ID] [ROUNDS]
#   GPU_ID      GPU index; exported as CUDA_VISIBLE_DEVICES and passed as --gpu
#               (default: 5)
#   PROBLEM_ID  problem identifier passed as --problem-id (default: Mbpp/7)
#   ROUNDS      value passed as --rounds (default: 3)
#
# The combined stdout/stderr of the training run is echoed to the terminal and
# written to a timestamped log file under LOG_DIR.
#
# Exit status: 0 when the training command succeeds, otherwise the training
# command's own exit status (or 1 if the log directory cannot be created).

# -u: fail on unset variables; pipefail: do not let `tee` hide a failed stage.
set -uo pipefail

# Defaults (overridable through positional arguments).
GPU_ID=${1:-5}
PROBLEM_ID=${2:-"Mbpp/7"}
ROUNDS=${3:-3}

# Environment for the training process.
export CUDA_VISIBLE_DEVICES="$GPU_ID"
export VLLM_ATTENTION_BACKEND=FLASH_ATTN
# NOTE(review): 0 presumably disables Ray's memory monitor; confirm against Ray docs.
export RAY_memory_monitor_refresh_ms=0
export RAY_LOGGING_LEVEL=DEBUG
export HYDRA_FULL_ERROR=1
# Append the project paths. The ${VAR:+...} form avoids a leading ':' (an empty
# entry, which Python treats as the current directory) when PYTHONPATH is
# unset or empty.
export PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}/home/ubuntu/RLVR/verl:/home/ubuntu/RLVR/TestTime-RLVR-v2"

# Log directory.
LOG_DIR="/home/ubuntu/RLVR/TestTime-RLVR-v2/logs"
if ! mkdir -p -- "$LOG_DIR"; then
  printf 'error: cannot create log directory: %s\n' "$LOG_DIR" >&2
  exit 1
fi

# Timestamped log file name; '/' in the problem id is replaced with '_' so the
# id can be used as part of a file name.
TIMESTAMP=$(date +%Y%m%d_%H%M%S)
SAFE_PROBLEM_ID=${PROBLEM_ID//\//_}
LOG_FILE="$LOG_DIR/single_problem_${SAFE_PROBLEM_ID}_${TIMESTAMP}.log"

# Banner summarising the run parameters.
echo "π― νΉμ λ¬Έμ  νμ΅ μμ"
echo "ββββββββββββββββββββββββββββββββββββββββ"
echo "π λ¬Έμ  ID: $PROBLEM_ID"
echo "π λΌμ΄λ μ: $ROUNDS"
echo "π₯οΈ GPU: $GPU_ID"
echo "π λ‘κ·Έ νμΌ: $LOG_FILE"
echo "ββββββββββββββββββββββββββββββββββββββββ"
echo ""

# Launch train_ttrlvr_azr.py; stderr is merged into stdout so both end up in
# the log file as well as on the terminal.
python /home/ubuntu/RLVR/TestTime-RLVR-v2/test/train_ttrlvr_azr.py \
  --benchmark mbpp \
  --problem-id "$PROBLEM_ID" \
  --rounds "$ROUNDS" \
  --gpu "$GPU_ID" \
  --model "Qwen/Qwen2.5-7B" \
  2>&1 | tee -- "$LOG_FILE"
# Status of the python stage itself, not of tee; must be read immediately
# after the pipeline.
train_status=${PIPESTATUS[0]}

echo ""
if (( train_status != 0 )); then
  # Do not report success when the training command failed.
  printf 'error: training exited with status %d. Log: %s\n' \
    "$train_status" "$LOG_FILE" >&2
  exit "$train_status"
fi
echo "β νμ΅ μλ£. λ‘κ·Έ νμΈ: $LOG_FILE"