component/tesseract: version up 4.1.1
Also enable shared parts and provide new languages: Simplied Chinese, Japanese and French
... | ... | @@ -10,43 +10,34 @@ extends = |
../fontconfig/buildout.cfg | ||
../lcms/buildout.cfg | ||
../pkgconfig/buildout.cfg | ||
./buildout.hash.cfg | ||
parts = | ||
tesseract | ||
tesseract-traineddata | ||
tesseract-eng-traineddata | ||
tesseract-osd-traineddata | ||
[tesseract] | ||
recipe = slapos.recipe.cmmi | ||
url = https://github.com/tesseract-ocr/tesseract/archive/6b250b58121a9858d3e3019a78a6f7d421bd0fc7.tar.gz | ||
md5sum = fdc38148ad8eb1bd0485a217503dd6d5 | ||
shared = true | ||
url = https://github.com/tesseract-ocr/tesseract/archive/refs/tags/4.1.1.tar.gz | ||
md5sum = 51fe2bcbff1bbce77a25d180fd247f7d | ||
pkg_config_depends = ${leptonica:location}/lib/pkgconfig:${fontconfig:location}/lib/pkgconfig:${fontconfig:pkg_config_depends}:${lcms2:location}/lib/pkgconfig:${xz-utils:location}/lib/pkgconfig | ||
pre-configure = | ||
autoreconf -ivf -I${pkgconfig:location}/share/aclocal -I${libtool:location}/share/aclocal -Wno-portability | ||
configure-options = | ||
--disable-static | ||
--datarootdir=${tesseract-traineddata:location} | ||
# XXX: tesseract seems not easily configurable at runtime about where to find | ||
# its trained data, so we set its datarootdir above to a controlled location | ||
|
||
environment = | ||
PATH=${pkgconfig:location}/bin:${autoconf:location}/bin:${automake:location}/bin:${libtool:location}/bin:${m4:location}/bin:${patch:location}/bin:%(PATH)s | ||
PKG_CONFIG_PATH=${:pkg_config_depends} | ||
LDFLAGS=-L${leptonica:location}/lib -Wl,-rpath=${leptonica:location}/lib -L${jbigkit:location}/lib -Wl,-rpath=${jbigkit:location}/lib -L${zlib:location}/lib -Wl,-rpath=${zlib:location}/lib | ||
[tesseract-traineddata] | ||
location = ${buildout:parts-directory}/${:_buildout_section_name_} | ||
post-make-hook = ${tesseract-download-traineddata:post-make-hook} | ||
tessdata-urls = ${tesseract-download-traineddata:urls} | ||
tessdata-location = @@LOCATION@@/share/tessdata/ | ||
[tesseract-eng-traineddata] | ||
recipe = slapos.recipe.build:download | ||
destination = ${tesseract-traineddata:location}/tessdata/eng.traineddata | ||
url = https://github.com/tesseract-ocr/tessdata/raw/590567f20dc044f6948a8e2c61afc714c360ad0e/eng.traineddata | ||
md5sum = 57e0df3d84fed9fbf8c7a8e589f8f012 | ||
[tesseract-osd-traineddata] | ||
recipe = slapos.recipe.build:download | ||
destination = ${tesseract-traineddata:location}/tessdata/osd.traineddata | ||
url = https://github.com/tesseract-ocr/tessdata/raw/590567f20dc044f6948a8e2c61afc714c360ad0e/osd.traineddata | ||
md5sum = 7611737524efd1ce2dde67eff629bbcf | ||
[tesseract-download-traineddata] | ||
post-make-hook = ${:_profile_base_location_}/${download-tessdata.py:filename}#${download-tessdata.py:md5sum}:post_make_hook | ||
urls = | ||
https://raw.githubusercontent.com/tesseract-ocr/tessdata/4.1.0/eng.traineddata#57e0df3d84fed9fbf8c7a8e589f8f012 | ||
https://raw.githubusercontent.com/tesseract-ocr/tessdata/4.1.0/osd.traineddata#7611737524efd1ce2dde67eff629bbcf | ||
https://raw.githubusercontent.com/tesseract-ocr/tessdata/4.1.0/fra.traineddata#a73e70c872f262895d93976febeb1638 | ||
https://raw.githubusercontent.com/tesseract-ocr/tessdata/4.1.0/jpn.traineddata#af3a30a9bec904e106aa8521e7caaeca | ||
https://raw.githubusercontent.com/tesseract-ocr/tessdata/4.1.0/chi_sim.traineddata#6965cb3213edd961cb16264e2ea45f5c |