Dagriffpatchfan committed on
Commit
5267def
·
verified ·
1 Parent(s): 9a3860f

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +3 -3
Dockerfile CHANGED
@@ -2,8 +2,8 @@ FROM ghcr.io/ggml-org/llama.cpp:full
2
 
3
  RUN apt update && apt install wget -y
4
 
5
- # This line downloads the high-quality F16 model
6
  RUN wget "https://huggingface.co/unsloth/gemma-3-270m-it-GGUF/resolve/main/gemma-3-270m-it-F16.gguf" -O /gemma-3-270m-it-F16.gguf
7
 
8
- # This command tells the server to load the F16 model on startup
9
- CMD ["--server", "-m", "/gemma-3-270m-it-F16.gguf", "--port", "7860", "--host", "0.0.0.0", "-c", "5000", "-n", "4000", "-t", "8", "--mlock"]
 
 
2
 
3
  RUN apt update && apt install wget -y
4
 
 
5
  RUN wget "https://huggingface.co/unsloth/gemma-3-270m-it-GGUF/resolve/main/gemma-3-270m-it-F16.gguf" -O /gemma-3-270m-it-F16.gguf
6
 
7
+ # Optimized for Gemma 3's native 32k context window.
8
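+ # WARNING: Raising the context from 5000 to 32000 tokens increases memory use, and --mlock keeps the model locked in RAM, so host RAM/CPU is the main limiting factor.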
9
+ CMD ["--server", "-m", "/gemma-3-270m-it-F16.gguf", "--port", "7860", "--host", "0.0.0.0", "-c", "32000", "-n", "4000", "-t", "8", "--mlock"]