You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
28 lines
587 B
Docker
28 lines
587 B
Docker
FROM ubuntu:18.04
|
|
|
|
ENV LC_ALL=C.UTF-8 LANG=C.UTF-8
|
|
|
|
RUN mkdir /var/lib/calamari-models
|
|
COPY data/calamari-models/GT4HistOCR /var/lib/calamari-models/GT4HistOCR
|
|
|
|
RUN apt-get update && \
|
|
apt-get install -y \
|
|
git \
|
|
libleptonica-dev \
|
|
libtesseract-dev \
|
|
libxml2-utils \
|
|
python3-pip \
|
|
tesseract-ocr-all \
|
|
xmlstarlet \
|
|
&& \
|
|
apt-get clean
|
|
|
|
COPY requirements.txt /tmp
|
|
RUN pip3 install --no-cache-dir -r /tmp/requirements.txt
|
|
|
|
COPY my_ocrd_workflow /usr/bin
|
|
COPY xsd /usr/bin/xsd
|
|
|
|
WORKDIR /data
|
|
CMD ["/usr/bin/my_ocrd_workflow"]
|