File size: 1,452 Bytes
24c2665
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
#!/bin/bash
# Run combined TTRLVR + AZR training for one specific benchmark problem.
#
# Usage: <this script> [GPU_ID] [PROBLEM_ID] [ROUNDS]
#   GPU_ID      value for the first positional argument (default: 5)
#   PROBLEM_ID  value for the second positional argument (default: Mbpp/7)
#   ROUNDS      value for the third positional argument (default: 3)

# Defaults: each falls back when its argument is missing or empty.
GPU_ID="${1:-5}"
PROBLEM_ID="${2:-Mbpp/7}"
ROUNDS="${3:-3}"

# Environment variables exported for the training process.
export CUDA_VISIBLE_DEVICES="$GPU_ID"
export VLLM_ATTENTION_BACKEND=FLASH_ATTN
export RAY_memory_monitor_refresh_ms=0
export RAY_LOGGING_LEVEL=DEBUG
export HYDRA_FULL_ERROR=1
# Append the project directories to PYTHONPATH. The ${VAR:+...} form emits the
# existing value plus a separator only when PYTHONPATH is set and non-empty, so
# an unset variable no longer produces a leading ':' (an empty path entry).
export PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}/home/ubuntu/RLVR/verl:/home/ubuntu/RLVR/TestTime-RLVR-v2"

# Log directory (created if it does not exist yet).
LOG_DIR="/home/ubuntu/RLVR/TestTime-RLVR-v2/logs"
mkdir -p -- "$LOG_DIR"

# Timestamped log file name. Every '/' in the problem ID is replaced with '_'
# so the ID can be embedded in a single file name; parameter expansion is used
# so the ID is never subject to word-splitting or glob expansion.
TIMESTAMP="$(date +%Y%m%d_%H%M%S)"
SAFE_PROBLEM_ID="${PROBLEM_ID//\//_}"
LOG_FILE="${LOG_DIR}/single_problem_${SAFE_PROBLEM_ID}_${TIMESTAMP}.log"

# Print a summary banner with the parameters in effect for this run.
# The user-facing text is Korean; the strings below are restored to proper
# UTF-8 (they had been mis-encoded into unreadable characters).
echo "🎯 특정 문제 학습 시작"            # "Starting training on a specific problem"
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
echo "📌 문제 ID: $PROBLEM_ID"           # problem ID
echo "🔄 라운드 수: $ROUNDS"             # number of rounds
echo "🖥️  GPU: $GPU_ID"
echo "📝 로그 파일: $LOG_FILE"           # log file
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
echo ""

# Run train_ttrlvr_azr.py; stdout and stderr are merged and mirrored to both
# the terminal and the log file through tee.
python /home/ubuntu/RLVR/TestTime-RLVR-v2/test/train_ttrlvr_azr.py \
    --benchmark mbpp \
    --problem-id "$PROBLEM_ID" \
    --rounds "$ROUNDS" \
    --gpu "$GPU_ID" \
    --model "Qwen/Qwen2.5-7B" \
    2>&1 | tee "$LOG_FILE"
# A pipeline's status is that of its last command (tee), which would hide a
# trainer failure. PIPESTATUS[0] is the python process's own exit status and
# must be read immediately after the pipeline.
train_status=${PIPESTATUS[0]}

echo ""
if (( train_status == 0 )); then
    # "Training finished. Check the log: ..."
    echo "✅ 학습 완료. 로그 확인: $LOG_FILE"
else
    # "Training failed (exit code: N). Check the log: ..."
    echo "❌ 학습 실패 (종료 코드: $train_status). 로그 확인: $LOG_FILE" >&2
fi

# Propagate the trainer's status so callers can detect failure.
exit "$train_status"