# ocrd-galley/wrapper/qurator/ocrd_galley/cli.py

import os
import subprocess
import sys
import colorama
from pathlib import Path
from termcolor import colored


DOCKER_IMAGE_TAG = os.environ.get("DOCKER_IMAGE_TAG", "maximum")  # TODO rename
LOG_LEVEL = os.environ.get("LOG_LEVEL", "INFO")


def _xdg_dir(variable, default):
    """Return the directory named by environment ``variable`` as a Path.

    Falls back to ``default`` when the variable is unset *or empty*, as the
    XDG Base Directory Specification requires. The value is always wrapped in
    a Path: os.environ yields plain strings, and a plain string cannot be
    joined with the ``/`` operator used further down.
    """
    value = os.environ.get(variable)
    return Path(value) if value else default


# xdg-user-dirs is only available under Python 3.10+ etc. pp. → it is simpler
# to just roll it on our own.
XDG_CONFIG_HOME = _xdg_dir("XDG_CONFIG_HOME", Path.home() / ".config")
XDG_DATA_HOME = _xdg_dir("XDG_DATA_HOME", Path.home() / ".local" / "share")
XDG_CACHE_HOME = _xdg_dir("XDG_CACHE_HOME", Path.home() / ".cache")

# ocrd_tesserocr: directory below XDG_DATA_HOME that is exported to the
# container as TESSDATA_PREFIX.
TESSDATA_PREFIX = XDG_DATA_HOME / "ocrd-resources" / "ocrd-tesserocr-recognize"

def main():
    """Entry point: hand the invoking command line over to the container.

    The first element of the command line is reduced to its base name, so the
    name this wrapper was invoked under becomes the command run inside the
    image. The image is ``ocrd/all`` tagged with DOCKER_IMAGE_TAG; a notice is
    printed in red whenever that tag is not the default "maximum".
    """
    colorama.init()

    # Strip any directory part from the program name; keep the arguments as-is.
    command_line = [os.path.basename(sys.argv[0]), *sys.argv[1:]]

    image = f"ocrd/all:{DOCKER_IMAGE_TAG}"

    using_default_tag = DOCKER_IMAGE_TAG == "maximum"
    if not using_default_tag:
        # Make it obvious that a non-default image is in use.
        print(colored(f"Using {image}", "red"))

    docker_run(command_line, image)


def _bind_mount(src, target):
    """Return the ``docker run`` arguments that bind-mount ``src`` at ``target``."""
    return ["--mount", "type=bind,src=%s,target=%s" % (src, target)]


def docker_run(argv, docker_image):
    """Run ``argv`` in a ``docker_image`` container, then exit with its status.

    The current working directory is bind-mounted at /data, the XDG
    config/data/cache directories are bind-mounted at the same paths they have
    on the host, and the container is started with the caller's uid/gid.

    Args:
        argv: Command and arguments to execute inside the container.
        docker_image: Name of the Docker image to run.

    This function does not return: it calls sys.exit() with the return code of
    the ``docker run`` process.
    """
    huggingface_dir = Path.home() / ".huggingface"

    # `docker run --mount type=bind` fails when the source path is missing, so
    # create every host directory that gets mounted below (not only
    # ~/.huggingface).
    for host_dir in (XDG_CONFIG_HOME, XDG_DATA_HOME, XDG_CACHE_HOME, huggingface_dir):
        os.makedirs(host_dir, exist_ok=True)

    docker_run_options = ["--rm", "-t"]
    docker_run_options += _bind_mount(os.getcwd(), "/data")
    docker_run_options += ["--mount", "type=tmpfs,target=/tmp"]
    docker_run_options += ["--user", "%s:%s" % (os.getuid(), os.getgid())]
    docker_run_options += ["-e", "LOG_LEVEL=%s" % LOG_LEVEL]
    # Name-only "-e" forwards the variable from the caller's environment.
    docker_run_options += ["-e", "_OCRD_COMPLETE"]

    # home directory
    docker_run_options += ["-e", "HOME=%s" % Path.home()]

    # .config
    docker_run_options += ["-e", "XDG_CONFIG_HOME=%s" % XDG_CONFIG_HOME]
    docker_run_options += _bind_mount(XDG_CONFIG_HOME, XDG_CONFIG_HOME)
    # .local/share
    docker_run_options += ["-e", "XDG_DATA_HOME=%s" % XDG_DATA_HOME]
    docker_run_options += _bind_mount(XDG_DATA_HOME, XDG_DATA_HOME)
    # .cache
    docker_run_options += ["-e", "XDG_CACHE_HOME=%s" % XDG_CACHE_HOME]
    docker_run_options += _bind_mount(XDG_CACHE_HOME, XDG_CACHE_HOME)
    # .huggingface
    # NOTE(review): the target lives under /root although HOME is set to the
    # host home and the container runs as the caller's uid — confirm this
    # mount is still picked up.
    docker_run_options += _bind_mount(huggingface_dir, Path("/root") / ".huggingface")

    # ocrd_tesserocr
    docker_run_options += ["-e", "TESSDATA_PREFIX=%s" % TESSDATA_PREFIX]

    # JAVA_TOOL_OPTIONS is used for Java proxy settings
    if os.environ.get("JAVA_TOOL_OPTIONS"):
        docker_run_options += ["-e", "JAVA_TOOL_OPTIONS"]

    # The containers currently need to run privileged to allow it to read from e.g.
    # /home on SELinux secured systems such as Fedora. We might want to use udica
    # instead in the future.
    docker_run_options += ["--privileged=true"]

    # Image name first, then the command to run inside the container.
    docker_run_options += [docker_image]
    docker_run_options += argv

    docker_run_command = ["docker", "run"] + docker_run_options
    completed = subprocess.run(docker_run_command)
    # Propagate the exit status of `docker run` to our caller.
    sys.exit(completed.returncode)


# Run main() only when this file is executed as a script, not when imported.
if __name__ == "__main__":
    main()
🚧 Add a wrapper script to call containers 4 years ago			`import os`
			`import subprocess`
			`import sys`
💄 Make 'Using ...:test-github-actions red' message red 2 years ago			`import colorama`
✨ Add minimal support for using ocrd resmgr 2 years ago			`from pathlib import Path`
💄 Make 'Using ...:test-github-actions red' message red 2 years ago			`from termcolor import colored`
🚧 Add a wrapper script to call containers 4 years ago

🚧 WIP: Migrate to using ocrd:all image + Update tests 8 months ago			`DOCKER_IMAGE_TAG = os.environ.get("DOCKER_IMAGE_TAG", "maximum") # TODO rename`
🚧 Add a wrapper script to call containers 4 years ago			`LOG_LEVEL = os.environ.get("LOG_LEVEL", "INFO")`

✨ Add minimal support for using ocrd resmgr 2 years ago			`# xdg-user-dirs is only available under Python 3.10+ etc. pp. → it is simpler`
			`# to just roll it on our own.`
			`XDG_CONFIG_HOME = os.environ.get("XDG_CONFIG_HOME", Path.home() / ".config")`
			`XDG_DATA_HOME = os.environ.get("XDG_DATA_HOME", Path.home() / ".local" / "share")`
🚧 Add WIP support for ocrd_trocr 2 years ago			`XDG_CACHE_HOME = os.environ.get("XDG_CACHE_HOME", Path.home() / ".cache")`
✨ Add minimal support for using ocrd resmgr 2 years ago
🐛 Fix ocrd resources for ocrd_tesserocr by setting TESSDATA_PREFIX 2 years ago			`# ocrd_tesserocr`
			`TESSDATA_PREFIX = XDG_DATA_HOME / "ocrd-resources" / "ocrd-tesserocr-recognize"`
🚧 Add a wrapper script to call containers 4 years ago
			`def main():`
💄 Make 'Using ...:test-github-actions red' message red 2 years ago			`colorama.init()`

🚧 Add a wrapper script to call containers 4 years ago			`argv = sys.argv.copy()`
			`argv[0] = os.path.basename(argv[0])`

🚧 WIP: Migrate to using ocrd:all image + Update tests 8 months ago			`docker_image = "ocrd/all:%s" % (DOCKER_IMAGE_TAG, )`
🐛 Run the correct image when user called 'ocrd resmgr {download,list-available}' 2 years ago
🚧 WIP: Migrate to using ocrd:all image + Update tests 8 months ago			`if DOCKER_IMAGE_TAG != "maximum":`
💄 Make 'Using ...:test-github-actions red' message red 2 years ago			`print(colored(f"Using {docker_image}", 'red'))`
🚧 Add a wrapper script to call containers 4 years ago			`docker_run(argv, docker_image)`


			`def docker_run(argv, docker_image):`
			`docker_run_options = []`
			`docker_run_options.extend(["--rm", "-t"])`
			`docker_run_options.extend(["--mount", "type=bind,src=%s,target=/data" % os.getcwd()])`
🚧 WIP: Migrate to using ocrd:all image + Update tests 8 months ago			`docker_run_options.extend(["--mount", "type=tmpfs,target=/tmp"])`
🚧 Add a wrapper script to call containers 4 years ago			`docker_run_options.extend(["--user", "%s:%s" % (os.getuid(), os.getgid())])`
			`docker_run_options.extend(["-e", "LOG_LEVEL=%s" % LOG_LEVEL])`
✨ Support ocrd tab completion through the wrapper 3 years ago			`docker_run_options.extend(["-e", "_OCRD_COMPLETE"])`
🚧 Add a wrapper script to call containers 4 years ago
🚧 Add WIP support for ocrd_trocr 2 years ago			`# home directory`
			`docker_run_options.extend(["-e", "HOME=%s" % Path.home()])`

🐛 Fix ocrd resources for ocrd_tesserocr by setting TESSDATA_PREFIX 2 years ago			`# .config`
✨ Add minimal support for using ocrd resmgr 2 years ago			`docker_run_options.extend(["-e", "XDG_CONFIG_HOME=%s" % XDG_CONFIG_HOME])`
			`docker_run_options.extend(["--mount", "type=bind,src=%s,target=%s" %`
			`(XDG_CONFIG_HOME, XDG_CONFIG_HOME)])`
🐛 Fix ocrd resources for ocrd_tesserocr by setting TESSDATA_PREFIX 2 years ago			`# .local/share`
✨ Add minimal support for using ocrd resmgr 2 years ago			`docker_run_options.extend(["-e", "XDG_DATA_HOME=%s" % XDG_DATA_HOME])`
			`docker_run_options.extend(["--mount", "type=bind,src=%s,target=%s" %`
			`(XDG_DATA_HOME, XDG_DATA_HOME)])`
🚧 Add WIP support for ocrd_trocr 2 years ago			`# .cache`
			`docker_run_options.extend(["-e", "XDG_CACHE_HOME=%s" % XDG_CACHE_HOME])`
			`docker_run_options.extend(["--mount", "type=bind,src=%s,target=%s" %`
			`(XDG_CACHE_HOME, XDG_CACHE_HOME)])`
			`# .huggingface`
			`os.makedirs(Path.home() / ".huggingface", exist_ok=True)`
			`docker_run_options.extend(["--mount", "type=bind,src=%s,target=%s" %`
			`(Path.home() / ".huggingface", Path("/root") / ".huggingface")])`
✨ Add minimal support for using ocrd resmgr 2 years ago
🐛 Fix ocrd resources for ocrd_tesserocr by setting TESSDATA_PREFIX 2 years ago			`# ocrd_tesserocr`
			`docker_run_options.extend(["-e", "TESSDATA_PREFIX=%s" % TESSDATA_PREFIX])`

🐛 ocrd-galley: Pass through JAVA_TOOL_OPTIONS for ocrd_fileformat 4 years ago			`# JAVA_TOOL_OPTIONS is used for Java proxy settings`
			`if os.environ.get("JAVA_TOOL_OPTIONS"):`
			`docker_run_options.extend(["-e", "JAVA_TOOL_OPTIONS"])`

🚧 Add a wrapper script to call containers 4 years ago			`# The containers currently need to run privileged to allow it to read from e.g.`
			`# /home on SELinux secured systems such as Fedora. We might want to use udica`
			`# instead in the future.`
			`docker_run_options.extend(["--privileged=true"])`

			`docker_run_options.extend([docker_image])`
			`docker_run_options.extend(argv)`

			`docker_run_command = ["docker", "run"] + docker_run_options`
			`c = subprocess.run(docker_run_command)`
			`sys.exit(c.returncode)`


			`if __name__ == "__main__":`
			`main()`