From 483577c54388b4cb6bd6f85226e44d3d5771e1bb Mon Sep 17 00:00:00 2001
From: Pavel Tomanek
Date: Mon, 17 Feb 2025 14:17:06 +0100
Subject: [PATCH] #511 PR version

---
Notes (below the three-dash line, so not part of the commit message):

Adds two EasyBuild easyconfigs under 511_tesseract/, both using the
GCCcore 13.3.0 toolchain:

* leptonica.eb - Leptonica 1.85.0 via the ConfigureMake easyblock.
* tesseract.eb - tesseract 5.5.0 via the CMakeMake easyblock, with
  Leptonica 1.85.0 listed as a dependency. tessdata_best 4.1.0 is
  listed as a second source; the postinstallcmds move its contents
  into share/tessdata, and modextrapaths maps TESSDATA_PREFIX to
  share/tessdata.

NOTE(review): configopts in tesseract.eb is a two-element list
(BUILD_SHARED_LIBS=ON, then OFF) and sanity_check_paths expects both
lib/libtesseract.a and the shared library. Presumably this relies on
EasyBuild running one configure/build/install pass per list element -
confirm.

 511_tesseract/leptonica.eb | 32 ++++++++++++++++++
 511_tesseract/tesseract.eb | 66 ++++++++++++++++++++++++++++++++++++++
 2 files changed, 98 insertions(+)
 create mode 100644 511_tesseract/leptonica.eb
 create mode 100644 511_tesseract/tesseract.eb

diff --git a/511_tesseract/leptonica.eb b/511_tesseract/leptonica.eb
new file mode 100644
index 00000000..88731b64
--- /dev/null
+++ b/511_tesseract/leptonica.eb
@@ -0,0 +1,32 @@
+easyblock = 'ConfigureMake'
+
+name = 'Leptonica'
+version = '1.85.0'
+
+homepage = 'http://www.leptonica.org'
+description = """Leptonica is a collection of pedagogically-oriented open source software
+ that is broadly useful for image processing and image analysis applications."""
+
+toolchain = {'name': 'GCCcore', 'version': '13.3.0'}
+
+source_urls = ['https://github.com/DanBloomberg/leptonica/releases/download/%(version)s/']
+sources = [SOURCELOWER_TAR_GZ]
+checksums = ['3745ae3bf271a6801a2292eead83ac926e3a9bc1bf622e9cd4dd0f3786e17205']
+
+builddependencies = [('binutils', '2.42')]
+
+dependencies = [
+    ('libpng', '1.6.43'),
+    ('LibTIFF', '4.6.0'),
+    ('libjpeg-turbo', '3.0.1'),
+    ('giflib', '5.2.1'),
+    ('libwebp', '1.4.0'),
+    ('zlib', '1.3.1'),
+]
+
+sanity_check_paths = {
+    'files': ['bin/convertformat'],
+    'dirs': ['include/leptonica', 'lib/pkgconfig']
+}
+
+moduleclass = 'vis'
diff --git a/511_tesseract/tesseract.eb b/511_tesseract/tesseract.eb
new file mode 100644
index 00000000..edd4d41c
--- /dev/null
+++ b/511_tesseract/tesseract.eb
@@ -0,0 +1,66 @@
+easyblock = 'CMakeMake'
+
+name = 'tesseract'
+version = '5.5.0'
+_tessdata_ver = '4.1.0'
+
+homepage = 'https://github.com/tesseract-ocr/tesseract'
+description = """Tesseract is an optical character recognition engine"""
+
+toolchain = {'name': 'GCCcore', 'version': '13.3.0'}
+
+github_account = 'tesseract-ocr'
+source_urls = [GITHUB_SOURCE]
+sources = [
+    '%(version)s.tar.gz',
+    {
+        'source_urls': ['https://github.com/tesseract-ocr/tessdata_best/archive/'],
+        'download_filename': '%s.tar.gz' % _tessdata_ver,
+        'filename': 'tessdata_best-%s.tar.gz' % _tessdata_ver,
+    },
+]
+checksums = [
+    {'5.5.0.tar.gz': 'f2fb34ca035b6d087a42875a35a7a5c4155fa9979c6132365b1e5a28ebc3fc11'},
+    {'tessdata_best-4.1.0.tar.gz': 'bb05b738298ae73e7130e2913ed002b49d94cd1cea508e63be1928fe47770b32'},
+]
+
+builddependencies = [
+    ('CMake', '3.29.3'),
+    ('binutils', '2.42'),
+    ('pkgconf', '2.2.0'),
+]
+
+dependencies = [
+    ('zlib', '1.3.1'),
+    ('libpng', '1.6.43'),
+    ('libjpeg-turbo', '3.0.1'),
+    ('LibTIFF', '4.6.0'),
+    ('Leptonica', '1.85.0'),
+    ('libarchive', '3.7.4'),
+    ('ICU', '75.1'),
+    ('fontconfig', '2.15.0'),
+    ('GLib', '2.80.4'),
+    ('cairo', '1.18.0'),
+    ('Pango', '1.54.0'),
+]
+
+configopts = ['-DBUILD_SHARED_LIBS=ON', '-DBUILD_SHARED_LIBS=OFF']
+
+postinstallcmds = [
+    'rm %(builddir)s/tessdata_best-*/configs',
+    'rm -rf %(builddir)s/tessdata_best-*/tessconfigs',
+    'mv %(builddir)s/tessdata_best-*/* %(installdir)s/share/tessdata'
+]
+
+modextrapaths = {
+    'TESSDATA_PREFIX': 'share/tessdata',
+}
+
+sanity_check_paths = {
+    'files': ['bin/tesseract', 'lib/libtesseract.a', 'lib/libtesseract.%s' % SHLIB_EXT],
+    'dirs': ['share/tessdata', 'include/tesseract']
+}
+
+sanity_check_commands = ['tesseract --version', 'tesseract --list-langs']
+
+moduleclass = 'vis'