FROM ubuntu:22.04

ARG PIP_INSTALL="pip install --no-cache-dir"
ARG OCRD_VERSION_MINIMUM="2.47.0"
ENV LC_ALL=C.UTF-8 LANG=C.UTF-8
ENV PIP_DEFAULT_TIMEOUT=120


RUN echo "APT::Acquire::Retries \"3\";" > /etc/apt/apt.conf.d/80-retries && \
    apt-get update && \
    apt-get install -y \
      build-essential \
      curl \
      git \
      xz-utils \
      pkg-config \
# For add-apt-repository:
      software-properties-common \
# XML utils
      libxml2-utils \
      xmlstarlet \
# OCR-D uses ImageMagick for pixel density estimation
      imagemagick \
# pyenv builds
# TODO: builder container?
      libz-dev \
      libssl-dev \
      libbz2-dev \
      liblzma-dev \
      libncurses-dev \
      libffi-dev \
      libreadline-dev \
      libsqlite3-dev \
      libmagic-dev \
    && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*


# Set up OCR-D logging
RUN echo "setOverrideLogLevel(os.getenv('LOG_LEVEL', 'INFO'))" >/etc/ocrd_logging.py


# Install pyenv
# TODO: do not run as root
# TODO: does just saying "3.7" work as intended?
ENV HOME=/root
ENV PYENV_ROOT=/usr/local/share/pyenv
ENV PATH=$PYENV_ROOT/shims:$PYENV_ROOT/bin:$PATH
RUN \
    git clone --depth=1 https://github.com/yyuu/pyenv.git $PYENV_ROOT && \
    pyenv install 3.7 && \
    pyenv global 3.7 && \
    pyenv rehash && \
    pip install -U pip wheel && \
    pip install setuptools

# Install pip installable-stuff
RUN ${PIP_INSTALL} \
        "ocrd >= ${OCRD_VERSION_MINIMUM}"


# Check pip dependencies
RUN pip check


WORKDIR /data

# Default command
CMD ['ocrd']