liamcripwell committed on
Commit
7e4b5d9
·
verified ·
1 Parent(s): 841fa30

Update start.sh

Browse files
Files changed (1) hide show
  1. start.sh +2 -2
start.sh CHANGED
@@ -7,8 +7,8 @@ python3 -m vllm.entrypoints.openai.api_server \
7
  --model numind/NuMarkdown-8B-Thinking \
8
  --port 8000 \
9
  --host 0.0.0.0 \
10
- --max-model-len 8048 \
11
- --gpu-memory-utilization 0.9 \
12
  --disable-log-requests \
13
  --tensor-parallel-size 1 \
14
  --trust-remote-code > $HOME/app/vllm.log 2>&1 &
 
7
  --model numind/NuMarkdown-8B-Thinking \
8
  --port 8000 \
9
  --host 0.0.0.0 \
10
+ --max-model-len 20000 \
11
+ --gpu-memory-utilization 0.95 \
12
  --disable-log-requests \
13
  --tensor-parallel-size 1 \
14
  --trust-remote-code > $HOME/app/vllm.log 2>&1 &