Spaces:
Running
Running
| FROM pytorch/pytorch:2.4.0-cuda11.8-cudnn9-runtime | |
| COPY --from=ghcr.io/astral-sh/uv:latest /uv /uvx /bin/ | |
| RUN apt-get update | |
| RUN apt-get install --fix-missing -y -q --no-install-recommends libgomp1 ffmpeg libsm6 pdftohtml libxext6 git ninja-build g++ qpdf pandoc | |
| RUN apt-get install -y ocrmypdf | |
| RUN apt-get install -y tesseract-ocr-fra | |
| RUN apt-get install -y tesseract-ocr-spa | |
| RUN apt-get install -y tesseract-ocr-deu | |
| RUN apt-get install -y tesseract-ocr-ara | |
| RUN apt-get install -y tesseract-ocr-mya | |
| RUN apt-get install -y tesseract-ocr-hin | |
| RUN apt-get install -y tesseract-ocr-tam | |
| RUN apt-get install -y tesseract-ocr-tha | |
| RUN apt-get install -y tesseract-ocr-chi-sim | |
| RUN apt-get install -y tesseract-ocr-tur | |
| RUN apt-get install -y tesseract-ocr-ukr | |
| RUN apt-get install -y tesseract-ocr-ell | |
| RUN apt-get install -y tesseract-ocr-rus | |
| RUN apt-get install -y tesseract-ocr-kor | |
| RUN apt-get install -y tesseract-ocr-kor-vert | |
| RUN mkdir -p /app/src | |
| RUN mkdir -p /app/models | |
| RUN addgroup --system python && adduser --system --group python | |
| RUN chown -R python:python /app | |
| USER python | |
| ENV VIRTUAL_ENV=/app/.venv | |
| RUN python -m venv $VIRTUAL_ENV | |
| ENV PATH="$VIRTUAL_ENV/bin:$PATH" | |
| COPY requirements.txt requirements.txt | |
| RUN uv pip install --upgrade pip | |
| RUN uv pip install -r requirements.txt | |
| WORKDIR /app | |
| RUN cd src; git clone https://github.com/facebookresearch/detectron2; | |
| RUN cd src/detectron2; git checkout 70f454304e1a38378200459dd2dbca0f0f4a5ab4; python setup.py build develop | |
| RUN uv pip install pycocotools==2.0.8 | |
| COPY ./start.sh ./start.sh | |
| COPY ./src/. ./src | |
| COPY ./models/. ./models/ | |
| RUN python src/download_models.py | |
| ENV PYTHONPATH "${PYTHONPATH}:/app/src" | |
| ENV TRANSFORMERS_VERBOSITY=error | |
| ENV TRANSFORMERS_NO_ADVISORY_WARNINGS=1 | |