tesseract: Update from 3.04.01 to 3.05.00
[termux-packages] / packages / tesseract / build.sh
CommitLineData
93779b4a
DM
# Package metadata for the Tesseract OCR engine.
TERMUX_PKG_HOMEPAGE=https://github.com/tesseract-ocr/tesseract
TERMUX_PKG_DESCRIPTION="Tesseract is probably the most accurate open source OCR engine available"
TERMUX_PKG_VERSION=3.05.00
TERMUX_PKG_DEPENDS="libtool, libuuid, leptonica"
# The source tarball URL and the unpacked folder name are both derived from the version.
TERMUX_PKG_SRCURL=https://github.com/tesseract-ocr/tesseract/archive/${TERMUX_PKG_VERSION}.tar.gz
# Checksum of the tarball above; must be updated together with TERMUX_PKG_VERSION.
TERMUX_PKG_SHA256=3fe83e06d0f73b39f6e92ed9fc7ccba3ef734877b76aa5ddaaa778fac095d996
TERMUX_PKG_FOLDERNAME=tesseract-${TERMUX_PKG_VERSION}

# Prepare the source tree before configure runs.
# Globals:  TERMUX_PREFIX (read), TERMUX_PKG_SRCDIR (read),
#           LIBLEPT_HEADERSDIR (exported)
# Returns:  non-zero if the source directory cannot be entered or a step fails.
termux_step_pre_configure() {
	# Export the location of the leptonica headers. See
	# http://blog.matt-swain.com/post/26419042500/installing-tesseract-ocr-on-mac-os-x-lion
	export LIBLEPT_HEADERSDIR="${TERMUX_PREFIX}/include/leptonica"

	# Stop if the source dir is missing so nothing below runs in the wrong place.
	cd "$TERMUX_PKG_SRCDIR" || return 1

	# Flip the ADD_RT setting in configure.ac from true to false
	# (presumably so the build does not try to link against librt - confirm).
	perl -p -i -e 's|ADD_RT], true|ADD_RT], false|g' configure.ac

	# Run after the edit above (presumably regenerates configure from configure.ac).
	./autogen.sh
}

# Download the English trained data into the installed tessdata directory.
# Globals:  TERMUX_PREFIX (read)
# Calls:    termux_download <url> <destination> (defined outside this file)
# Returns:  non-zero if the tessdata directory cannot be entered or a download fails.
termux_step_post_make_install() {
	local data_file

	# Stop if the directory is missing so the rm below cannot hit the wrong place.
	cd "${TERMUX_PREFIX}/share/tessdata" || return 1
	# Remove any previously installed English data files first.
	rm -f -- eng.*

	for data_file in cube.{bigrams,fold,lm,nn,params,size,word-freq} tesseract_cube.nn traineddata; do
		data_file="eng.${data_file}"
		# From the tessdata README: "These language data files only work with
		# Tesseract 4. They are based on the sources in tesseract-ocr/langdata on GitHub.
		# Get language data files for Tesseract 3.04 or 3.05 from the 3.04 tree."
		termux_download \
			"https://raw.githubusercontent.com/tesseract-ocr/tessdata/3.04.00/${data_file}" \
			"${data_file}" || return 1
	done
}