2023-03-15 17:04:59 +01:00
|
|
|
# Tag of the ocrd-galley-core base image to build on. Declared before FROM so
# it can be used in the FROM line; override with --build-arg GIT_COMMIT=<tag>.
ARG GIT_COMMIT=latest
FROM quratorspk/ocrd-galley-core:${GIT_COMMIT}
|
2020-08-14 14:37:20 +02:00
|
|
|
|
2020-12-03 18:45:52 +01:00
|
|
|
# Command prefix used for every pip installation in this image
# (--no-cache-dir keeps pip's download cache out of the layers).
ARG PIP_INSTALL="pip install --no-cache-dir"
# Release of OCR-D/ocrd_olena to build; selects the v<version> source archive.
ARG OCRD_OLENA_VERSION=1.3.0
|
2020-08-14 14:37:20 +02:00
|
|
|
|
2020-09-25 16:11:11 +02:00
|
|
|
|
2020-08-14 14:37:20 +02:00
|
|
|
# Build ocrd_olena
# Step 1: install ImageMagick from the distribution repositories. The package
# index is refreshed and purged again within the same layer so that no apt
# metadata is left behind in the image.
RUN apt-get update \
 && apt-get install -y imagemagick \
 && apt-get clean \
 && rm -rf /var/lib/apt/lists/*
|
2023-08-11 18:18:19 +02:00
|
|
|
|
|
|
|
# Install olena from .deb
#
# The prebuilt olena-bin package is downloaded, installed with dpkg while
# ignoring unmet dependencies (--force-depends), and the missing dependencies
# are then pulled in by "apt-get -f install". Download, install and cleanup
# all happen in one layer so neither the .deb nor the apt lists persist.
#
# curl runs with -f (--fail) so that an HTTP error aborts the build right at
# the download step instead of saving the server's error page as the .deb.
#
# The final check runs "scribo-cli sauvola --help" and fails the build if the
# tool cannot be executed.
RUN curl -fsSL --retry 3 -O https://qurator-data.de/~mike.gerber/olena_2.1.0+ocrd-git+2-ubuntu22.04/olena-bin_2.1.0+ocrd-git+2_amd64.deb && \
    dpkg -i --force-depends olena-bin_2.1.0+ocrd-git+2_amd64.deb && \
    rm -f olena-bin_2.1.0+ocrd-git+2_amd64.deb && \
    apt-get update && \
    apt-get -f install -y && \
    apt-get clean && rm -rf /var/lib/apt/lists/* && \
    if ! scribo-cli sauvola --help >/dev/null 2>&1; then echo "Olena/scribo is not installed correctly" >&2; exit 1; fi
|
2020-08-14 17:17:25 +02:00
|
|
|
# Build and install ocrd_olena ${OCRD_OLENA_VERSION} from its GitHub source
# archive.
#
# - xmlstarlet is installed with apt-get (not the interactive "apt" front
#   end), with -y and a fresh "apt-get update": earlier layers delete
#   /var/lib/apt/lists, so without the update the package cannot be located,
#   and without -y the install may stop at a confirmation prompt.
#   NOTE(review): xmlstarlet is presumably needed by the ocrd_olena scripts;
#   confirm against the upstream Makefile.
# - curl runs with -f so an HTTP error fails the build at the download step.
# - sed strips the "deps" prerequisite from the Makefile's install target, so
#   "make install" does not run the upstream dependency setup; the "ocrd"
#   Python package is installed explicitly via ${PIP_INSTALL} instead.
# - The source tree, the tarball and the apt lists are removed in this same
#   layer so they do not end up in the image.
RUN apt-get update && \
    apt-get install -y xmlstarlet && \
    apt-get clean && rm -rf /var/lib/apt/lists/* && \
    curl -fsSL --retry 3 -o ocrd_olena.tar.gz https://github.com/OCR-D/ocrd_olena/archive/v${OCRD_OLENA_VERSION}.tar.gz && \
    mkdir ocrd_olena && \
    tar xvz -C ocrd_olena --strip-components=1 -f ocrd_olena.tar.gz && \
    cd ocrd_olena && \
    sed -i 's/^install: deps/install:/' Makefile && \
    ${PIP_INSTALL} ocrd && \
    make install PREFIX=/usr/local && \
    cd .. && rm -rf ocrd_olena ocrd_olena.tar.gz
|
|
|
|
|
|
|
|
|
|
|
|
# Sanity check: fail the build if the installed Python packages have
# missing or incompatible requirements.
RUN pip check
|
2020-08-14 14:37:20 +02:00
|
|
|
|
|
|
|
|
|
|
|
# Default command
# Exec form must be a valid JSON array, i.e. use double quotes. With single
# quotes Docker falls back to shell form and tries to run the literal text
# through /bin/sh -c, which fails at container start.
CMD ["ocrd-olena-binarize"]
|