# OCR-D base image: Ubuntu 22.04 with a pyenv-built Python and the `ocrd`
# package installed from PyPI.
FROM ubuntu:22.04

# Command prefix used for Python package installs; --no-cache-dir keeps pip's
# download cache out of the image layer.
ARG PIP_INSTALL="pip install --no-cache-dir"
# Lowest acceptable version of the `ocrd` package.
ARG OCRD_VERSION_MINIMUM="2.23.3"
# Exact Python version built by pyenv. A full version is given (instead of the
# bare "3.7" prefix) so the build does not depend on pyenv's prefix resolution.
# Override with --build-arg PYTHON_VERSION=... if needed.
ARG PYTHON_VERSION="3.7.17"

ENV LC_ALL=C.UTF-8 \
    LANG=C.UTF-8
ENV PIP_DEFAULT_TIMEOUT=120

# System packages. Retries are configured first so that flaky mirrors do not
# fail the build. DEBIAN_FRONTEND is set inline (not via ENV) so that package
# configuration never waits for input, without leaking into the runtime env.
RUN echo "APT::Acquire::Retries \"3\";" > /etc/apt/apt.conf.d/80-retries && \
    apt-get update && \
    DEBIAN_FRONTEND=noninteractive apt-get install -y \
        curl xz-utils \
        build-essential python3-dev \
        # For cloning pyenv over HTTPS:
        ca-certificates \
        git \
        # Headers needed by pyenv to compile CPython with ssl, zlib, bz2,
        # readline, sqlite3, ctypes, lzma and curses support:
        libbz2-dev \
        libffi-dev \
        liblzma-dev \
        libncursesw5-dev \
        libreadline-dev \
        libsqlite3-dev \
        libssl-dev \
        zlib1g-dev \
        # For get-pip.py:
        python3-distutils \
        # For add-apt-repository:
        software-properties-common \
        # XML utils
        libxml2-utils \
        xmlstarlet \
        # OCR-D uses ImageMagick for pixel density estimation
        imagemagick \
    && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*

# Set up OCR-D logging: write the log-level override (taken from $LOG_LEVEL,
# default INFO) to /etc/ocrd_logging.py.
RUN echo "setOverrideLogLevel(os.getenv('LOG_LEVEL', 'INFO'))" >/etc/ocrd_logging.py

# Install pyenv
# TODO: do not run as root
ENV HOME=/root
ENV PYENV_ROOT=$HOME/.pyenv
ENV PATH=$PYENV_ROOT/shims:$PYENV_ROOT/bin:$PATH
# Clone into $PYENV_ROOT explicitly: the build's working directory is "/", so a
# relative ".pyenv" target would not match the PATH entries set above.
# HTTPS is used because GitHub no longer serves the unauthenticated git://
# protocol.
RUN git clone --depth=1 https://github.com/pyenv/pyenv.git "$PYENV_ROOT" && \
    pyenv install "${PYTHON_VERSION}" && \
    pyenv global "${PYTHON_VERSION}" && \
    pyenv rehash

# Install pip installable-stuff
RUN ${PIP_INSTALL} \
    "ocrd >= ${OCRD_VERSION_MINIMUM}"

# Check pip dependencies
RUN pip check

WORKDIR /data

# Default command. Exec form requires a JSON array with double quotes; with
# single quotes Docker falls back to shell form and the command is not `ocrd`.
CMD ["ocrd"]