# Base image and locale for the OCR workflow image.
# NOTE(review): ubuntu:18.04 is past its standard support window; consider
# moving to a newer LTS tag once the package list below is verified there.
FROM ubuntu:18.04

# Select the C.UTF-8 locale for every build step and for the running container.
ENV LC_ALL=C.UTF-8 LANG=C.UTF-8

# System packages: git, Leptonica/Tesseract development files, all Tesseract
# language data, XML command-line tooling (libxml2-utils, xmlstarlet) and pip.
# - update and install share one layer so a cached, stale package index is
#   never reused for a changed package list.
# - DEBIAN_FRONTEND is set inline (not via ENV) so package configuration never
#   waits for input during the build, without leaking into the runtime env.
# - The apt package index is removed in the same layer; deleting it in a later
#   layer would not shrink the image.
# NOTE(review): --no-install-recommends is intentionally NOT added. The pip
# installs later in this file may rely on packages pulled in as recommends of
# python3-pip (build toolchain, setuptools) - confirm before slimming this.
RUN apt-get update && \
    DEBIAN_FRONTEND=noninteractive apt-get install -y \
        git \
        libleptonica-dev \
        libtesseract-dev \
        libxml2-utils \
        python3-pip \
        tesseract-ocr-all \
        xmlstarlet \
    && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*

# Install the Python dependencies listed in requirements.txt.
# Only the manifest is copied for this step, so the pip layer is reused from
# cache as long as requirements.txt and the layers above it are unchanged.
# The trailing slash makes it explicit that /tmp is a directory destination.
COPY requirements.txt /tmp/
RUN pip3 install --no-cache-dir -r /tmp/requirements.txt

# Install the workflow entry point into /usr/bin (it is the image's default
# command) together with the xsd files under /usr/bin/xsd.
COPY my_ocrd_workflow /usr/bin/
# NOTE(review): presumably xsd is a directory of XML schema files read by the
# workflow script - confirm; the destination is kept exactly as before.
COPY xsd /usr/bin/xsd

# XXX Hack: bundle the ocr-eval experiment and install its Python dependencies.
# The source used to be written as "../experiments/ocr-eval". COPY sources are
# always resolved inside the build context: parent-directory segments are
# stripped by BuildKit and rejected by the classic builder, so the path is
# spelled here the way it is effectively resolved.
# NOTE(review): this requires experiments/ocr-eval to exist inside the build
# context - confirm which directory is passed as context when building.
COPY experiments/ocr-eval /usr/local/ocr-eval
RUN pip3 install --no-cache-dir -r /usr/local/ocr-eval/requirements.txt

# Runtime defaults: start in /data and run the workflow script.
# WORKDIR creates /data if it does not exist.
# NOTE(review): presumably /data is where the documents to process are
# mounted - confirm against how the container is run.
# NOTE(review): no USER is set, so the process runs as root; switching to a
# non-root user needs a check that it can still write to the mounted /data.
WORKDIR /data

# Exec (JSON-array) form: the script is started directly, without a wrapping
# shell, so it receives signals such as the SIGTERM sent by `docker stop`.
CMD ["/usr/bin/my_ocrd_workflow"]