# Runtime image: PyTorch 2.4.0 / CUDA 11.8 base plus PDF/OCR tooling, Tesseract
# language packs, a source build of detectron2 pinned to a commit, and the
# application sources and models.

# uv image tag to take the `uv`/`uvx` binaries from. Defaults to `latest`
# (the previous hard-coded value); pass `--build-arg UV_VERSION=<tag>` to get
# reproducible builds.
ARG UV_VERSION=latest
FROM ghcr.io/astral-sh/uv:${UV_VERSION} AS uv

FROM pytorch/pytorch:2.4.0-cuda11.8-cudnn9-runtime

COPY --from=uv /uv /uvx /bin/

# System packages. `update` and `install` share one layer so a cached, stale
# package index is never reused, and the index is removed in the same layer so
# it does not end up in the image.
# The second install intentionally keeps recommended packages enabled, exactly
# as before, so the set of installed packages does not change.
RUN apt-get update \
    && apt-get install --fix-missing -y -q --no-install-recommends \
        ffmpeg \
        g++ \
        git \
        libgomp1 \
        libsm6 \
        libxext6 \
        ninja-build \
        pandoc \
        pdftohtml \
        qpdf \
    && apt-get install -y \
        ocrmypdf \
        tesseract-ocr-ara \
        tesseract-ocr-chi-sim \
        tesseract-ocr-deu \
        tesseract-ocr-ell \
        tesseract-ocr-fra \
        tesseract-ocr-hin \
        tesseract-ocr-kor \
        tesseract-ocr-kor-vert \
        tesseract-ocr-mya \
        tesseract-ocr-rus \
        tesseract-ocr-spa \
        tesseract-ocr-tam \
        tesseract-ocr-tha \
        tesseract-ocr-tur \
        tesseract-ocr-ukr \
    && rm -rf /var/lib/apt/lists/*

# Application tree owned by an unprivileged system user; everything below this
# point runs as that user.
RUN mkdir -p /app/src /app/models \
    && addgroup --system python \
    && adduser --system --group python \
    && chown -R python:python /app
USER python

# Virtual environment that receives all Python dependencies. Putting its bin/
# first on PATH makes `python` resolve to the venv interpreter from here on.
ENV VIRTUAL_ENV=/app/.venv
RUN python -m venv "$VIRTUAL_ENV"
ENV PATH="$VIRTUAL_ENV/bin:$PATH"

# Dependency manifest is copied on its own so this layer stays cached until
# requirements.txt changes. The relative destination resolves against the
# working directory inherited from the base image (WORKDIR is only set below).
# --no-cache keeps uv's download cache out of the image layers.
COPY requirements.txt requirements.txt
RUN uv pip install --no-cache --upgrade pip \
    && uv pip install --no-cache -r requirements.txt

WORKDIR /app

# detectron2 is built from source at a fixed commit. Steps are chained with
# `&&` so a failed clone or checkout aborts the build instead of silently
# building whatever happens to be in the directory.
RUN git clone https://github.com/facebookresearch/detectron2 src/detectron2 \
    && git -C src/detectron2 checkout 70f454304e1a38378200459dd2dbca0f0f4a5ab4
WORKDIR /app/src/detectron2
RUN python setup.py build develop
WORKDIR /app

# Installed after the detectron2 build, as in the original ordering.
RUN uv pip install --no-cache pycocotools==2.0.8

# Application code and models come last: they change most often, so the
# expensive dependency layers above remain cached.
COPY ./start.sh ./start.sh
COPY ./src/. ./src
COPY ./models/. ./models/
RUN python src/download_models.py

# Runtime environment (key=value form; the space-separated form is deprecated).
ENV PYTHONPATH="${PYTHONPATH}:/app/src" \
    TRANSFORMERS_VERBOSITY=error \
    TRANSFORMERS_NO_ADVISORY_WARNINGS=1