Spaces:
Sleeping
Sleeping
Upload Dockerfile
Browse files- Dockerfile +17 -19
Dockerfile
CHANGED
|
@@ -5,12 +5,13 @@ ENV PYTHONUNBUFFERED=1 \
|
|
| 5 |
PIP_NO_CACHE_DIR=1 \
|
| 6 |
HF_HUB_DISABLE_TELEMETRY=1 \
|
| 7 |
PORT=7860 \
|
| 8 |
-
|
| 9 |
-
HF_HOME=/
|
| 10 |
-
TRANSFORMERS_CACHE=/
|
| 11 |
-
SENTENCE_TRANSFORMERS_HOME=/
|
|
|
|
| 12 |
|
| 13 |
-
#
|
| 14 |
RUN apt-get update && apt-get install -y --no-install-recommends curl git && \
|
| 15 |
rm -rf /var/lib/apt/lists/*
|
| 16 |
|
|
@@ -26,30 +27,27 @@ RUN python -m pip install --upgrade pip && \
|
|
| 26 |
# ---- App code ----
|
| 27 |
COPY . .
|
| 28 |
|
| 29 |
-
#
|
| 30 |
-
|
|
|
|
|
|
|
| 31 |
RUN python - <<'PY'
|
| 32 |
from sentence_transformers import SentenceTransformer
|
| 33 |
SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")
|
| 34 |
-
print("✅ SBERT
|
| 35 |
PY
|
| 36 |
|
| 37 |
-
# 2) Cache NLTK VADER lexicon into /app/nltk_data
|
| 38 |
RUN python - <<'PY'
|
| 39 |
import os, nltk
|
| 40 |
-
os.makedirs("/
|
| 41 |
-
nltk.download("vader_lexicon"
|
| 42 |
-
print("✅
|
| 43 |
PY
|
| 44 |
|
| 45 |
-
#
|
| 46 |
-
RUN
|
| 47 |
-
import tldextract
|
| 48 |
-
tldextract.extract("example.com")
|
| 49 |
-
print("✅ tldextract PSL cached")
|
| 50 |
-
PY
|
| 51 |
|
| 52 |
EXPOSE 7860
|
| 53 |
|
| 54 |
# ---- Run ----
|
| 55 |
-
CMD ["sh",
|
|
|
|
| 5 |
PIP_NO_CACHE_DIR=1 \
|
| 6 |
HF_HUB_DISABLE_TELEMETRY=1 \
|
| 7 |
PORT=7860 \
|
| 8 |
+
# ✅ Writable + persistent on HF Spaces:
|
| 9 |
+
HF_HOME=/data/hf_cache \
|
| 10 |
+
TRANSFORMERS_CACHE=/data/hf_cache \
|
| 11 |
+
SENTENCE_TRANSFORMERS_HOME=/data/hf_cache \
|
| 12 |
+
NLTK_DATA=/data/nltk_data
|
| 13 |
|
| 14 |
+
# small tools
|
| 15 |
RUN apt-get update && apt-get install -y --no-install-recommends curl git && \
|
| 16 |
rm -rf /var/lib/apt/lists/*
|
| 17 |
|
|
|
|
| 27 |
# ---- App code ----
|
| 28 |
COPY . .
|
| 29 |
|
| 30 |
+
# ✅ Make caches writable for the runtime user
|
| 31 |
+
RUN mkdir -p /data/hf_cache /data/nltk_data && chmod -R 777 /data
|
| 32 |
+
|
| 33 |
+
# (optional) pre-warm models into /data caches to speed first run
|
| 34 |
RUN python - <<'PY'
|
| 35 |
from sentence_transformers import SentenceTransformer
|
| 36 |
SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")
|
| 37 |
+
print("✅ SBERT cached")
|
| 38 |
PY
|
| 39 |
|
|
|
|
| 40 |
RUN python - <<'PY'
|
| 41 |
import os, nltk
|
| 42 |
+
os.makedirs(os.getenv("NLTK_DATA","/data/nltk_data"), exist_ok=True)
|
| 43 |
+
nltk.download("vader_lexicon")
|
| 44 |
+
print("✅ VADER cached")
|
| 45 |
PY
|
| 46 |
|
| 47 |
+
# ensure everything under /data is writable after warm
|
| 48 |
+
RUN chmod -R 777 /data
|
|
|
|
|
|
|
|
|
|
|
|
|
| 49 |
|
| 50 |
EXPOSE 7860
|
| 51 |
|
| 52 |
# ---- Run ----
|
| 53 |
+
CMD ["sh","-c","uvicorn main:app --host 0.0.0.0 --port ${PORT:-7860}"]
|