# rwkv-hf-space / Dockerfile
# Last commit: adb6ad5 "UPDATE: Add frontend" (sparkleman)
# Tag of the nvidia/cuda base image; override with --build-arg CUDA_IMAGE=<tag>.
ARG CUDA_IMAGE=12.4.0-runtime-ubuntu22.04
FROM nvidia/cuda:$CUDA_IMAGE
# Install the native build toolchain and git (git is used below to clone the
# frontend repository).
# `set -eu` is required: heredoc lines are not implicitly `&&`-chained, so
# without it a failed install would be masked by the clean-up commands that
# follow and the layer would still be committed.
# ca-certificates is listed explicitly so HTTPS clones do not depend on the
# base image happening to ship CA roots.
RUN <<EOF
set -eu
apt-get update
DEBIAN_FRONTEND=noninteractive apt-get install --no-install-recommends -y \
    build-essential \
    ca-certificates \
    git
apt-get clean
rm -rf /var/lib/apt/lists/*
EOF
# Install Node.js (LTS channel) and npm from the NodeSource repository.
# - curl is installed here because this step needs it and nothing earlier in
#   the file installs it.
# - The setup script is downloaded to a file instead of being piped into bash:
#   under the default /bin/sh (no pipefail) a failed download would be hidden
#   by bash exiting 0 on empty input.
# - apt lists are removed in the same layer so they do not persist in the image.
RUN apt-get update && \
    apt-get install -y --no-install-recommends ca-certificates curl && \
    curl -fsSL https://deb.nodesource.com/setup_lts.x -o /tmp/nodesource_setup.sh && \
    bash /tmp/nodesource_setup.sh && \
    apt-get install -y --no-install-recommends nodejs && \
    rm -f /tmp/nodesource_setup.sh && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*

# Install pnpm globally; the frontend build below runs `pnpm install` / `pnpm run build`.
RUN npm install -g pnpm && \
    npm cache clean --force
# Clone the frontend repository and build it; the build output ends up in
# /frontend/dist. A shallow clone is enough because only the working tree is built.
# NOTE(review): the clone follows the default branch head, so builds are not
# reproducible; consider pinning a tag or commit.
RUN git clone --depth 1 https://github.com/SolomonLeon/web-rwkv-realweb.git /frontend
WORKDIR /frontend
RUN pnpm install && pnpm run build

# Bring the uv and uvx binaries in from the ghcr.io/astral-sh/uv image.
# NOTE(review): `:latest` is unpinned; pin a version tag or digest for
# reproducible builds.
COPY --from=ghcr.io/astral-sh/uv:latest /uv /uvx /bin/

# The build context is deliberately NOT copied into /frontend here: the
# application sources are copied into the app directory further down, and
# dropping them on top of the frontend checkout only bloated the image and
# risked overwriting build output.
# Create an unprivileged user with a fixed UID (1000) and switch to it for
# every remaining build step and at runtime.
RUN useradd -m -u 1000 user
USER user
ENV HOME=/home/user \
    PATH=/home/user/.local/bin:$PATH
WORKDIR $HOME/app

# Application sources from the build context, owned by the runtime user.
COPY --chown=user . $HOME/app

# Place the built frontend next to the application.
# /frontend/dist is produced inside this image by the earlier `pnpm run build`
# step, and COPY can only read from the build context (or from another
# stage/image via --from), so the files have to be copied with a RUN.
# `dist/.` copies the directory contents, matching COPY's directory semantics;
# the step runs as `user`, so the copies are owned by that user.
RUN mkdir -p "$HOME/app/dist-frontend" && \
    cp -r /frontend/dist/. "$HOME/app/dist-frontend/"
# Generate the application's local configuration file.
# Layout: server settings (HOST, PORT), inference settings (STRATEGY,
# RWKV_CUDA_ON, CHUNK_LEN), then MODELS, a list with one entry per model; each
# entry carries its download location and a nested DEFAULT_SAMPLER mapping.
# The nesting below is significant YAML structure: every model field must be
# indented under its `- SERVICE_NAME` item and every sampler field under
# DEFAULT_SAMPLER, otherwise the keys collapse into the top-level mapping.
# Comments are kept out of the heredoc body so the generated file content
# consists of configuration only.
RUN cat > "$HOME/app/config.local.yaml" <<EOF
HOST: "0.0.0.0"
PORT: 7860
STRATEGY: "cuda fp16"
RWKV_CUDA_ON: False
CHUNK_LEN: 256
MODELS:
  - SERVICE_NAME: "RWKV-x070-World-0.1B-v2.8-20241210-ctx4096"
    DOWNLOAD_MODEL_FILE_NAME: "RWKV-x070-World-0.1B-v2.8-20241210-ctx4096.pth"
    DOWNLOAD_MODEL_REPO_ID: "BlinkDL/rwkv-7-world"
    DOWNLOAD_MODEL_DIR: "./"
    REASONING: False
    DEFAULT: True
    DEFAULT_SAMPLER:
      max_tokens: 512
      temperature: 1.0
      top_p: 0.3
      presence_penalty: 0.5
      count_penalty: 0.5
      penalty_decay: 0.996
      stop:
        - "\n\n"
  - SERVICE_NAME: "RWKV7-G1-0.1B-68%trained-20250303-ctx4k"
    DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-0.1B-68%trained-20250303-ctx4k.pth"
    DOWNLOAD_MODEL_REPO_ID: "BlinkDL/temp-latest-training-models"
    DOWNLOAD_MODEL_DIR: "./"
    REASONING: True
    DEFAULT: True
    DEFAULT_SAMPLER:
      max_tokens: 4096
      temperature: 1.0
      top_p: 0.3
      presence_penalty: 0.5
      count_penalty: 0.5
      penalty_decay: 0.996
      stop:
        - "\n\n"
EOF
# Install the project's dependencies from the existing lockfile (--frozen: do
# not update it), including the optional "cu124" extra.
RUN uv sync --frozen --extra cu124

# Port set as PORT in the generated config.local.yaml. EXPOSE is documentation
# only; it does not publish the port.
EXPOSE 7860

# Exec (JSON array) form. The array must be valid JSON: a trailing comma makes
# Docker fall back to shell form and try to run the bracketed text as a
# command, which fails at container start.
CMD ["uv", "run", "app.py"]