File size: 1,452 Bytes
24c2665 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 |
#!/bin/bash
# Run TTRLVR + AZR integrated training on one specific problem.
#
# Positional arguments (all optional):
#   $1  GPU id        (default: 5)
#   $2  problem id    (default: Mbpp/7)
#   $3  round count   (default: 3)

# Each value falls back to its default when the argument is missing or empty.
GPU_ID="${1:-5}"
PROBLEM_ID="${2:-Mbpp/7}"
ROUNDS="${3:-3}"
# Environment variables exported for the training process.
# CUDA device visibility follows the GPU id chosen on the command line.
export CUDA_VISIBLE_DEVICES="$GPU_ID"
export VLLM_ATTENTION_BACKEND=FLASH_ATTN
export RAY_memory_monitor_refresh_ms=0
export RAY_LOGGING_LEVEL=DEBUG
export HYDRA_FULL_ERROR=1
# Append the two project checkouts to PYTHONPATH. The ${VAR:+...} form emits
# the existing value plus a ":" separator only when PYTHONPATH is already
# non-empty, so an unset PYTHONPATH does not yield a leading empty entry
# (an empty entry can make Python search the current directory).
export PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}/home/ubuntu/RLVR/verl:/home/ubuntu/RLVR/TestTime-RLVR-v2"
# Log directory; created (with parents) when it does not exist yet.
LOG_DIR="/home/ubuntu/RLVR/TestTime-RLVR-v2/logs"
mkdir -p "$LOG_DIR"

#######################################
# Make a problem id usable as part of a file name.
# Arguments: $1 - problem id, e.g. "Mbpp/7"
# Outputs:   the id with every "/" replaced by "_", written to stdout
#######################################
sanitize_problem_id() {
  # Parameter expansion keeps the id intact; piping an unquoted `echo $id`
  # through tr would word-split and glob-expand the id first.
  printf '%s\n' "${1//\//_}"
}

# Timestamp (YYYYmmdd_HHMMSS) that gives every run its own log file.
TIMESTAMP=$(date +%Y%m%d_%H%M%S)
SAFE_PROBLEM_ID=$(sanitize_problem_id "$PROBLEM_ID")
LOG_FILE="$LOG_DIR/single_problem_${SAFE_PROBLEM_ID}_${TIMESTAMP}.log"
# Start-up banner: a title, then the problem id, round count, GPU and log file
# framed by two rule lines, followed by one blank line.
# NOTE(review): the message text appears mis-encoded in this copy of the file;
# it is reproduced unchanged here — confirm against the original source.
printf '%s\n' \
  "π― νΉμ λ¬Έμ νμ΅ μμ" \
  "ββββββββββββββββββββββββββββββββββββββββ" \
  "π λ¬Έμ ID: $PROBLEM_ID" \
  "π λΌμ΄λ μ: $ROUNDS" \
  "π₯οΈ GPU: $GPU_ID" \
  "π λ‘κ·Έ νμΌ: $LOG_FILE" \
  "ββββββββββββββββββββββββββββββββββββββββ" \
  ""
# Run train_ttrlvr_azr.py for the selected problem. stderr is merged into
# stdout and the combined stream is shown on the terminal and written to
# LOG_FILE via tee.
python /home/ubuntu/RLVR/TestTime-RLVR-v2/test/train_ttrlvr_azr.py \
  --benchmark mbpp \
  --problem-id "$PROBLEM_ID" \
  --rounds "$ROUNDS" \
  --gpu "$GPU_ID" \
  --model "Qwen/Qwen2.5-7B" \
  2>&1 | tee "$LOG_FILE"

# The pipeline's own status is tee's, which would hide a failed training run;
# PIPESTATUS[0] is python's exit code and must be read right after the pipeline.
train_status=${PIPESTATUS[0]}
if (( train_status != 0 )); then
  printf 'train_ttrlvr_azr.py exited with status %d; see %s\n' \
    "$train_status" "$LOG_FILE" >&2
  exit "$train_status"
fi
# Closing message: a blank line, then a completion notice that names the log
# file for this run.
# NOTE(review): the message text appears mis-encoded in this copy of the file
# and spans two lines; the text is kept unchanged — confirm against the
# original source.
echo ""
echo "β
νμ΅ μλ£. λ‘κ·Έ νμΈ: $LOG_FILE"