FROM ubuntu:22.04 ARG PIP_INSTALL="pip install --no-cache-dir" ARG OCRD_VERSION_MINIMUM="2.47.0" ENV LC_ALL=C.UTF-8 LANG=C.UTF-8 ENV PIP_DEFAULT_TIMEOUT=120 RUN echo "APT::Acquire::Retries \"3\";" > /etc/apt/apt.conf.d/80-retries && \ apt-get update && \ apt-get install -y \ build-essential \ curl \ git \ xz-utils \ pkg-config \ # For add-apt-repository: software-properties-common \ # XML utils libxml2-utils \ xmlstarlet \ # OCR-D uses ImageMagick for pixel density estimation imagemagick \ # pyenv builds # TODO: builder container? libz-dev \ libssl-dev \ libbz2-dev \ liblzma-dev \ libncurses-dev \ libffi-dev \ libreadline-dev \ libsqlite3-dev \ libmagic-dev \ && \ apt-get clean && \ rm -rf /var/lib/apt/lists/* # Set up OCR-D logging RUN echo "setOverrideLogLevel(os.getenv('LOG_LEVEL', 'INFO'))" >/etc/ocrd_logging.py # Install pyenv # TODO: do not run as root # TODO: does just saying "3.7" work as intended? ENV HOME=/root ENV PYENV_ROOT=/usr/local/share/pyenv ENV PATH=$PYENV_ROOT/shims:$PYENV_ROOT/bin:$PATH RUN \ git clone --depth=1 https://github.com/yyuu/pyenv.git $PYENV_ROOT && \ pyenv install 3.7 && \ pyenv global 3.7 && \ pyenv rehash && \ pip install -U pip wheel && \ pip install setuptools # Install pip installable-stuff RUN ${PIP_INSTALL} \ "ocrd >= ${OCRD_VERSION_MINIMUM}" # Check pip dependencies RUN pip check WORKDIR /data # Default command CMD ['ocrd']