Spaces:
Sleeping
Sleeping
fix(build): set writable TRANSFORMERS_CACHE and pre-download distilbert tokenizer/model
Browse files - Dockerfile +5 -3
Dockerfile
CHANGED
|
@@ -15,10 +15,12 @@ ARG HF_MODEL_REPO=Jaja-09/authorcheck-model
|
|
| 15 |
# Download model snapshot from HF model repo
|
| 16 |
RUN python -c "from huggingface_hub import snapshot_download; snapshot_download(repo_id='${HF_MODEL_REPO}', local_dir='/app/model')"
|
| 17 |
|
| 18 |
-
#
|
| 19 |
ENV NLTK_DATA=/app/nltk_data
|
| 20 |
-
|
| 21 |
-
|
|
|
|
|
|
|
| 22 |
|
| 23 |
EXPOSE 7860
|
| 24 |
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
|
|
|
|
| 15 |
# Download model snapshot from HF model repo
|
| 16 |
RUN python -c "from huggingface_hub import snapshot_download; snapshot_download(repo_id='${HF_MODEL_REPO}', local_dir='/app/model')"
|
| 17 |
|
| 18 |
+
# Use writable caches inside /app
|
| 19 |
ENV NLTK_DATA=/app/nltk_data
|
| 20 |
+
ENV TRANSFORMERS_CACHE=/app/hf_cache
|
| 21 |
+
RUN mkdir -p /app/nltk_data /app/hf_cache && \
|
| 22 |
+
python -c "import nltk; nltk.download('punkt', download_dir='/app/nltk_data', quiet=True)" && \
|
| 23 |
+
python -c "from transformers import AutoTokenizer, AutoModelForSequenceClassification; m='distilbert-base-uncased-finetuned-sst-2-english'; AutoTokenizer.from_pretrained(m, cache_dir='/app/hf_cache'); AutoModelForSequenceClassification.from_pretrained(m, cache_dir='/app/hf_cache')"
|
| 24 |
|
| 25 |
EXPOSE 7860
|
| 26 |
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
|