|
FROM nvidia/cuda:12.1.1-cudnn8-runtime-ubuntu22.04 |
|
|
|
ENV DEBIAN_FRONTEND=noninteractive |
|
ENV PATH="/root/.local/bin:$PATH" |
|
|
|
|
|
RUN echo "user:x:1000:1000::/home/user:/bin/bash" >> /etc/passwd && \ |
|
mkdir -p /home/user && chown 1000:1000 /home/user |
|
|
|
|
|
RUN apt-get update && apt-get install -y \ |
|
python3.10 \ |
|
python3.10-venv \ |
|
python3.10-distutils \ |
|
python3-pip \ |
|
curl \ |
|
git \ |
|
ffmpeg \ |
|
libsndfile1 \ |
|
&& apt-get clean |
|
|
|
|
|
RUN ln -sf /usr/bin/python3.10 /usr/bin/python && \ |
|
ln -sf /usr/bin/pip3 /usr/bin/pip |
|
|
|
|
|
RUN curl -Ls https://astral.sh/uv/install.sh | bash && \ |
|
~/.local/bin/uv pip install --system "vllm[audio]" --extra-index-url https://wheels.vllm.ai/nightly |
|
|
|
|
|
RUN pip install huggingface_hub |
|
|
|
|
|
RUN python -c "from huggingface_hub import snapshot_download; snapshot_download('mistralai/Voxtral-Mini-3B-2507')" |
|
|
|
|
|
EXPOSE 8000 |
|
|
|
|
|
CMD ["vllm", "serve", "mistralai/Voxtral-Mini-3B-2507", "--tokenizer_mode", "mistral", "--config_format", "mistral", "--load_format", "mistral"] |
|
|