mirror of
https://github.com/qurator-spk/ocrd-galley.git
synced 2025-06-09 22:59:53 +02:00
✨ Use sbb_textline_detector to segment lines
This commit is contained in:
parent
735e9599d7
commit
6454d20998
6 changed files with 49 additions and 11 deletions
|
@ -17,6 +17,8 @@ RUN apt-get update && \
|
|||
cmake libgif-dev libjpeg-dev libpng-dev libtiff-dev zlib1g-dev \
|
||||
# For clstm on Ubuntu 19.04:
|
||||
swig libeigen3-dev libpng-dev libprotobuf-dev \
|
||||
# For cv2:
|
||||
libsm6 libxrender1 \
|
||||
# XML utils
|
||||
libxml2-utils \
|
||||
xmlstarlet \
|
||||
|
@ -53,6 +55,11 @@ COPY data/tesseract-models/GT4HistOCR/GT4HistOCR_2000000.traineddata $TESSDATA_P
|
|||
RUN tesseract --list-langs
|
||||
|
||||
|
||||
# Copy over sbb_textline_detector
|
||||
COPY vendor vendor
|
||||
COPY data/textline_detection /var/lib/textline_detection
|
||||
|
||||
|
||||
COPY requirements.txt /tmp
|
||||
RUN pip3 install --no-cache-dir -r /tmp/requirements.txt
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue