X-Git-Url: https://git.distorted.org.uk/~mdw/termux-packages/blobdiff_plain/202a1fb5d3efb4affe66cabc1f5ed33de0db1d80..6788ea2c5d7dbb05b18c9da41b1f88f9d4400c2a:/packages/tesseract/build.sh diff --git a/packages/tesseract/build.sh b/packages/tesseract/build.sh index 3f79ad76..5e020320 100644 --- a/packages/tesseract/build.sh +++ b/packages/tesseract/build.sh @@ -18,13 +18,11 @@ termux_step_post_make_install() { # download english trained data cd "${TERMUX_PREFIX}/share/tessdata" rm -f eng.* - wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.bigrams - wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.fold - wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.lm - wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.nn - wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.params - wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.size - wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.word-freq - wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.tesseract_cube.nn - wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.traineddata + for f in cube.{bigrams,fold,lm,nn,params,size,word-freq} tesseract_cube.nn traineddata; do + f=eng.$f + # From the tessdata README: "These language data files only work with + # Tesseract 4. They are based on the sources in tesseract-ocr/langdata on GitHub. + # Get language data files for Tesseract 3.04 or 3.05 from the 3.04 tree." + termux_download https://raw.githubusercontent.com/tesseract-ocr/tessdata/3.04.00/$f $f + done }