termux-packages/packages/tesseract/build.sh

# Package metadata for the tesseract recipe (TERMUX_PKG_* variables;
# presumably read by the Termux build framework that sources this file).
TERMUX_PKG_HOMEPAGE="https://github.com/tesseract-ocr/tesseract"
TERMUX_PKG_DESCRIPTION='Tesseract is probably the most accurate open source OCR engine available'
# The version is defined once and reused below for the source URL and folder name.
TERMUX_PKG_VERSION=3.05.01
TERMUX_PKG_DEPENDS='libtool, libuuid, leptonica'
TERMUX_PKG_SRCURL="https://github.com/tesseract-ocr/tesseract/archive/${TERMUX_PKG_VERSION}.tar.gz"
# NOTE(review): presumably the SHA-256 of the archive at TERMUX_PKG_SRCURL;
# it has to be refreshed whenever TERMUX_PKG_VERSION changes -- confirm.
TERMUX_PKG_SHA256='05898f93c5d057fada49b9a116fc86ad9310ff1726a0f499c3e5211b3af47ec1'
TERMUX_PKG_FOLDERNAME="tesseract-${TERMUX_PKG_VERSION}"

termux_step_pre_configure() {
	# http://blog.matt-swain.com/post/26419042500/installing-tesseract-ocr-on-mac-os-x-lion
	export LIBLEPT_HEADERSDIR=${TERMUX_PREFIX}/include/leptonica

	perl -p -i -e 's|ADD_RT], true|ADD_RT], false|g' configure.ac
	./autogen.sh
}

termux_step_post_make_install() {
	# Replace the English data files in ${TERMUX_PREFIX}/share/tessdata with
	# copies fetched from the 3.04.00 tree of the tessdata repository.
	#
	# Globals:  TERMUX_PREFIX (read)
	# Calls:    termux_download <url> <destination> (defined outside this file)
	# Returns:  non-zero if the tessdata directory cannot be entered or a
	#           download fails.
	# Note:     the working directory is left at the tessdata directory.
	local tessdata_dir="${TERMUX_PREFIX}/share/tessdata"
	local suffix file

	# Bail out if the directory is missing: otherwise the rm and the downloads
	# below would operate on whatever directory the caller happened to be in.
	cd "$tessdata_dir" || return 1

	# Drop any previously installed English data before downloading.
	rm -f -- eng.*

	for suffix in cube.{bigrams,fold,lm,nn,params,size,word-freq} tesseract_cube.nn traineddata; do
		file="eng.${suffix}"
		# From the tessdata README: "These language data files only work with
		# Tesseract 4. They are based on the sources in tesseract-ocr/langdata on GitHub.
		# Get language data files for Tesseract 3.04 or 3.05 from the 3.04 tree."
		termux_download \
			"https://raw.githubusercontent.com/tesseract-ocr/tessdata/3.04.00/${file}" \
			"${file}" || return 1
	done
}
Added Leptonica and Tesseract packages 2016-02-06 13:57:02 +01:00			`TERMUX_PKG_HOMEPAGE=https://github.com/tesseract-ocr/tesseract`
			`TERMUX_PKG_DESCRIPTION="Tesseract is probably the most accurate open source OCR engine available"`
tesseract: Update from 3.05.00 to 3.05.01 2017-06-07 11:08:13 +02:00			`TERMUX_PKG_VERSION=3.05.01`
Added Leptonica and Tesseract packages 2016-02-06 13:57:02 +01:00			`TERMUX_PKG_DEPENDS="libtool, libuuid, leptonica"`
			`TERMUX_PKG_SRCURL=https://github.com/tesseract-ocr/tesseract/archive/${TERMUX_PKG_VERSION}.tar.gz`
tesseract: Update from 3.05.00 to 3.05.01 2017-06-07 11:08:13 +02:00			`TERMUX_PKG_SHA256=05898f93c5d057fada49b9a116fc86ad9310ff1726a0f499c3e5211b3af47ec1`
Added Leptonica and Tesseract packages 2016-02-06 13:57:02 +01:00			`TERMUX_PKG_FOLDERNAME=tesseract-${TERMUX_PKG_VERSION}`

			`termux_step_pre_configure() {`
Added fmemopen support to Leptonica 2016-03-27 13:21:42 +02:00			`# http://blog.matt-swain.com/post/26419042500/installing-tesseract-ocr-on-mac-os-x-lion`
Added Leptonica and Tesseract packages 2016-02-06 13:57:02 +01:00			`export LIBLEPT_HEADERSDIR=${TERMUX_PREFIX}/include/leptonica`

tesseract: Update from 3.04.01 to 3.05.00 2017-03-27 05:27:36 +02:00			`perl -p -i -e 's\|ADD_RT], true\|ADD_RT], false\|g' configure.ac`
Added Leptonica and Tesseract packages 2016-02-06 13:57:02 +01:00			`./autogen.sh`
			`}`

			`termux_step_post_make_install() {`
Added fmemopen support to Leptonica 2016-03-27 13:21:42 +02:00			`# download english trained data`
Added Leptonica and Tesseract packages 2016-02-06 13:57:02 +01:00			`cd "${TERMUX_PREFIX}/share/tessdata"`
			`rm -f eng.*`
tesseract: Use termux_download 2016-05-31 11:52:40 +02:00			`for f in cube.{bigrams,fold,lm,nn,params,size,word-freq} tesseract_cube.nn traineddata; do`
			`f=eng.$f`
tesseract: Fix build after tessdata repo updates 2017-01-07 06:59:09 +01:00			`# From the tessdata README: "These language data files only work with`
			`# Tesseract 4. They are based on the sources in tesseract-ocr/langdata on GitHub.`
			`# Get language data files for Tesseract 3.04 or 3.05 from the 3.04 tree."`
tesseract: Update from 3.04.01 to 3.05.00 2017-03-27 05:27:36 +02:00			`termux_download \`
			`https://raw.githubusercontent.com/tesseract-ocr/tessdata/3.04.00/$f \`
			`$f`
tesseract: Use termux_download 2016-05-31 11:52:40 +02:00			`done`
Added Leptonica and Tesseract packages 2016-02-06 13:57:02 +01:00			`}`