Spaces: Running on L40S
Update start.sh
Browse files
start.sh CHANGED
@@ -7,8 +7,8 @@ python3 -m vllm.entrypoints.openai.api_server \
  7 |   --model numind/NuMarkdown-8B-Thinking \
  8 |   --port 8000 \
  9 |   --host 0.0.0.0 \
 10 | - --max-model-len
 11 | - --gpu-memory-utilization 0.
 12 |   --disable-log-requests \
 13 |   --tensor-parallel-size 1 \
 14 |   --trust-remote-code > $HOME/app/vllm.log 2>&1 &

  7 |   --model numind/NuMarkdown-8B-Thinking \
  8 |   --port 8000 \
  9 |   --host 0.0.0.0 \
 10 | + --max-model-len 20000 \
 11 | + --gpu-memory-utilization 0.95 \
 12 |   --disable-log-requests \
 13 |   --tensor-parallel-size 1 \
 14 |   --trust-remote-code > $HOME/app/vllm.log 2>&1 &