From 93779b4a2b5ab1599b30a2c5fcf51697c7134408 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?David=20Mart=C3=ADnez?= Date: Sat, 6 Feb 2016 13:57:02 +0100 Subject: [PATCH 1/3] Added Leptonica and Tesseract packages --- packages/leptonica/build.sh | 7 +++++++ packages/tesseract/build.sh | 29 +++++++++++++++++++++++++++++ 2 files changed, 36 insertions(+) create mode 100644 packages/leptonica/build.sh create mode 100644 packages/tesseract/build.sh diff --git a/packages/leptonica/build.sh b/packages/leptonica/build.sh new file mode 100644 index 000000000..ed15fa77a --- /dev/null +++ b/packages/leptonica/build.sh @@ -0,0 +1,7 @@ +TERMUX_PKG_HOMEPAGE=http://www.leptonica.com/ +TERMUX_PKG_DESCRIPTION="Leptonica is a pedagogically-oriented open source site containing software that is broadly useful for image processing and image analysis applications" +TERMUX_PKG_VERSION=1.73 +TERMUX_PKG_BUILD_REVISION=1 +TERMUX_PKG_DEPENDS="libtiff" +TERMUX_PKG_SRCURL=http://www.leptonica.com/source/leptonica-${TERMUX_PKG_VERSION}.tar.gz +TERMUX_PKG_EXTRA_CONFIGURE_ARGS="--without-giflib --without-libwebp" diff --git a/packages/tesseract/build.sh b/packages/tesseract/build.sh new file mode 100644 index 000000000..928e3bbb6 --- /dev/null +++ b/packages/tesseract/build.sh @@ -0,0 +1,29 @@ +TERMUX_PKG_HOMEPAGE=https://github.com/tesseract-ocr/tesseract +TERMUX_PKG_DESCRIPTION="Tesseract is probably the most accurate open source OCR engine available" +TERMUX_PKG_VERSION=3.04.00 +TERMUX_PKG_BUILD_REVISION=1 +TERMUX_PKG_DEPENDS="libtool, libuuid, leptonica" +TERMUX_PKG_SRCURL=https://github.com/tesseract-ocr/tesseract/archive/${TERMUX_PKG_VERSION}.tar.gz +TERMUX_PKG_FOLDERNAME=tesseract-${TERMUX_PKG_VERSION} + +termux_step_pre_configure() { + export LIBLEPT_HEADERSDIR=${TERMUX_PREFIX}/include/leptonica + + cd $TERMUX_PKG_SRCDIR + perl -p -i -e 's|ADD_RT, true|ADD_RT, false|g' configure.ac + ./autogen.sh +} + +termux_step_post_make_install() { + cd "${TERMUX_PREFIX}/share/tessdata" + rm -f eng.* + 
wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.bigrams + wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.fold + wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.lm + wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.nn + wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.params + wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.size + wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.word-freq + wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.tesseract_cube.nn + wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.traineddata +} From 2225c1f45a6d0b1cb9e9b43f65cbf6e3c54cfdd2 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?David=20Mart=C3=ADnez?= Date: Tue, 22 Mar 2016 22:36:59 +0100 Subject: [PATCH 2/3] tesseract: added JPEG and PNG support --- packages/leptonica/build.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/packages/leptonica/build.sh b/packages/leptonica/build.sh index ed15fa77a..54195d4a9 100644 --- a/packages/leptonica/build.sh +++ b/packages/leptonica/build.sh @@ -2,6 +2,6 @@ TERMUX_PKG_HOMEPAGE=http://www.leptonica.com/ TERMUX_PKG_DESCRIPTION="Leptonica is a pedagogically-oriented open source site containing software that is broadly useful for image processing and image analysis applications" TERMUX_PKG_VERSION=1.73 TERMUX_PKG_BUILD_REVISION=1 -TERMUX_PKG_DEPENDS="libtiff" +TERMUX_PKG_DEPENDS="libjpeg-turbo, libpng, libtiff" TERMUX_PKG_SRCURL=http://www.leptonica.com/source/leptonica-${TERMUX_PKG_VERSION}.tar.gz -TERMUX_PKG_EXTRA_CONFIGURE_ARGS="--without-giflib --without-libwebp" +TERMUX_PKG_EXTRA_CONFIGURE_ARGS="--without-giflib --without-libwebp CPPFLAGS=-I/data/data/com.termux/files/usr/include" From f27308373c06bcfd2891d6faa804f577c9a68da1 Mon Sep 17 00:00:00 2001 From: 
=?UTF-8?q?David=20Mart=C3=ADnez?= Date: Sun, 27 Mar 2016 13:21:42 +0200 Subject: [PATCH 3/3] Added fmemopen support to Leptonica --- packages/leptonica/build.sh | 18 +++++++++++++++++- packages/tesseract/build.sh | 4 +++- 2 files changed, 20 insertions(+), 2 deletions(-) diff --git a/packages/leptonica/build.sh b/packages/leptonica/build.sh index 54195d4a9..e6eaeddf7 100644 --- a/packages/leptonica/build.sh +++ b/packages/leptonica/build.sh @@ -4,4 +4,20 @@ TERMUX_PKG_VERSION=1.73 TERMUX_PKG_BUILD_REVISION=1 TERMUX_PKG_DEPENDS="libjpeg-turbo, libpng, libtiff" TERMUX_PKG_SRCURL=http://www.leptonica.com/source/leptonica-${TERMUX_PKG_VERSION}.tar.gz -TERMUX_PKG_EXTRA_CONFIGURE_ARGS="--without-giflib --without-libwebp CPPFLAGS=-I/data/data/com.termux/files/usr/include" +TERMUX_PKG_EXTRA_CONFIGURE_ARGS="--without-giflib --without-libwebp" + +termux_step_pre_configure() { + export ac_cv_func_fmemopen=yes +} + +termux_step_post_configure() { + # add fmemopen support from https://github.com/j-jorge/android-stdioext + cd $TERMUX_PKG_SRCDIR/src + + wget --quiet https://raw.githubusercontent.com/j-jorge/android-stdioext/master/include/stdioext.h + wget --quiet https://github.com/j-jorge/android-stdioext/raw/master/src/fmemopen.c + wget --quiet https://github.com/j-jorge/android-stdioext/raw/master/src/fopencookie.c + wget --quiet https://raw.githubusercontent.com/j-jorge/android-stdioext/master/src/open_memstream.c + + echo '#include "stdioext.h"' >> alltypes.h +} diff --git a/packages/tesseract/build.sh b/packages/tesseract/build.sh index 928e3bbb6..54ffb71ff 100644 --- a/packages/tesseract/build.sh +++ b/packages/tesseract/build.sh @@ -1,12 +1,13 @@ TERMUX_PKG_HOMEPAGE=https://github.com/tesseract-ocr/tesseract TERMUX_PKG_DESCRIPTION="Tesseract is probably the most accurate open source OCR engine available" -TERMUX_PKG_VERSION=3.04.00 +TERMUX_PKG_VERSION=3.04.01 TERMUX_PKG_BUILD_REVISION=1 TERMUX_PKG_DEPENDS="libtool, libuuid, leptonica" 
TERMUX_PKG_SRCURL=https://github.com/tesseract-ocr/tesseract/archive/${TERMUX_PKG_VERSION}.tar.gz TERMUX_PKG_FOLDERNAME=tesseract-${TERMUX_PKG_VERSION} termux_step_pre_configure() { + # set the Leptonica headers directory before configure runs; see http://blog.matt-swain.com/post/26419042500/installing-tesseract-ocr-on-mac-os-x-lion export LIBLEPT_HEADERSDIR=${TERMUX_PREFIX}/include/leptonica cd $TERMUX_PKG_SRCDIR @@ -15,6 +16,7 @@ termux_step_pre_configure() { } termux_step_post_make_install() { + # download English trained data cd "${TERMUX_PREFIX}/share/tessdata" rm -f eng.* wget https://raw.githubusercontent.com/tesseract-ocr/tessdata/master/eng.cube.bigrams