Spaces:

Dagriffpatchfan
/

5000tokens-1

Running

Dagriffpatchfan committed on 7 days ago

Commit

5267def

verified ·

1 Parent(s): 9a3860f

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -2,8 +2,8 @@ FROM ghcr.io/ggml-org/llama.cpp:full
 RUN apt update && apt install wget -y
-# This line downloads the high-quality F16 model
 RUN wget "https://huggingface.co/unsloth/gemma-3-270m-it-GGUF/resolve/main/gemma-3-270m-it-F16.gguf" -O /gemma-3-270m-it-F16.gguf
-# This command tells the server to load the F16 model on startup
-CMD ["--server", "-m", "/gemma-3-270m-it-F16.gguf", "--port", "7860", "--host", "0.0.0.0", "-c", "5000", "-n", "4000", "-t", "8", "--mlock"]

 RUN apt update && apt install wget -y
 RUN wget "https://huggingface.co/unsloth/gemma-3-270m-it-GGUF/resolve/main/gemma-3-270m-it-F16.gguf" -O /gemma-3-270m-it-F16.gguf
+# Optimized for Gemma 3's native 32k context window.
+# WARNING: Hardware limitations (RAM/CPU) are the main concern.
+CMD ["--server", "-m", "/gemma-3-270m-it-F16.gguf", "--port", "7860", "--host", "0.0.0.0", "-c", "32000", "-n", "4000", "-t", "8", "--mlock"]