Commit
·
c66163e
1
Parent(s):
53a76ed
chore: set HF caches to /data/hf and install accelerate for faster model load
Browse files- Dockerfile +9 -3
Dockerfile
CHANGED
|
@@ -5,7 +5,11 @@ FROM python:3.10-slim
|
|
| 5 |
ENV PIP_NO_CACHE_DIR=1 \
|
| 6 |
PYTHONDONTWRITEBYTECODE=1 \
|
| 7 |
PYTHONUNBUFFERED=1 \
|
| 8 |
-
HF_HUB_ENABLE_HF_TRANSFER=1
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9 |
|
| 10 |
WORKDIR /app
|
| 11 |
|
|
@@ -29,10 +33,12 @@ RUN python -m pip install --upgrade pip && \
|
|
| 29 |
# CPU-only torch to avoid CUDA/xformers issues on Spaces CPU images
|
| 30 |
python -m pip install --index-url https://download.pytorch.org/whl/cpu torch torchvision torchaudio --upgrade --force-reinstall && \
|
| 31 |
# Ensure xformers is not installed
|
| 32 |
-
python -m pip uninstall -y xformers || true
|
|
|
|
|
|
|
| 33 |
|
| 34 |
EXPOSE 7860
|
| 35 |
|
| 36 |
ENV DATA_DIR=/data
|
| 37 |
-
RUN mkdir -p /data && chmod -R 777 /data
|
| 38 |
CMD ["python", "-m", "uvicorn", "server:app", "--host", "0.0.0.0", "--port", "7860"]
|
|
|
|
| 5 |
ENV PIP_NO_CACHE_DIR=1 \
|
| 6 |
PYTHONDONTWRITEBYTECODE=1 \
|
| 7 |
PYTHONUNBUFFERED=1 \
|
| 8 |
+
HF_HUB_ENABLE_HF_TRANSFER=1 \
|
| 9 |
+
# Hugging Face cache locations: HF_HOME and the cache variables that follow all point at /data/hf.
# NOTE(review): recent transformers releases reportedly warn that TRANSFORMERS_CACHE is deprecated
# in favour of HF_HOME — confirm against the installed version before removing it.
HF_HOME=/data/hf \
|
| 10 |
+
TRANSFORMERS_CACHE=/data/hf \
|
| 11 |
+
DIFFUSERS_CACHE=/data/hf \
|
| 12 |
+
HUGGINGFACE_HUB_CACHE=/data/hf
|
| 13 |
|
| 14 |
WORKDIR /app
|
| 15 |
|
|
|
|
| 33 |
# CPU-only torch to avoid CUDA/xformers issues on Spaces CPU images
|
| 34 |
python -m pip install --index-url https://download.pytorch.org/whl/cpu torch torchvision torchaudio --upgrade --force-reinstall && \
|
| 35 |
# Ensure xformers is not installed
|
| 36 |
+
# Best-effort removal: xformers may not be installed, so tolerate a failure of this one command.
# The subshell keeps "|| true" scoped to the uninstall; without it, sh's left-associative
# equal-precedence && / || would let "|| true" mask a failure of any earlier step in this chain.
(python -m pip uninstall -y xformers || true) && \
|
| 37 |
+
# Speed up and lower RAM during model load
|
| 38 |
+
python -m pip install accelerate
|
| 39 |
|
| 40 |
EXPOSE 7860
|
| 41 |
|
| 42 |
ENV DATA_DIR=/data
|
| 43 |
+
# Create the data directory tree (mkdir -p also creates the /data parent) and open it up
# recursively so the runtime process can write to both /data and /data/hf.
RUN mkdir -p /data/hf && chmod -R 777 /data
|
| 44 |
CMD ["python", "-m", "uvicorn", "server:app", "--host", "0.0.0.0", "--port", "7860"]
|