tesseract-ocr: update to 3.05.00

This commit is contained in:
Jürgen Buchmüller 2017-02-20 20:50:14 +01:00
parent d9678627de
commit 16a23fa962

View file

@@ -1,13 +1,13 @@
# Template file for 'tesseract-ocr' # Template file for 'tesseract-ocr'
pkgname=tesseract-ocr pkgname=tesseract-ocr
version=3.04.01 version=3.05.00
revision=2 revision=1
wrksrc=tesseract-${version} wrksrc=tesseract-${version}
_tessdata_ver=6c9657715d38cb44aea9135605860b1b61b0e275 _tessdata_ver=8bf2e7ad08db9ca174ae2b0b3a7498c9f1f71d40
build_style=gnu-configure build_style=gnu-configure
configure_args="LIBLEPT_HEADERSDIR=${XBPS_CROSS_BASE}/usr/include" configure_args="LIBLEPT_HEADERSDIR=${XBPS_CROSS_BASE}/usr/include"
hostmakedepends="automake libtool leptonica" hostmakedepends="automake libtool pkg-config leptonica"
makedepends="pango-devel leptonica-devel" makedepends="cairo-devel pango-devel leptonica-devel icu-devel"
short_desc="Tesseract Open Source OCR engine" short_desc="Tesseract Open Source OCR engine"
maintainer="Jürgen Buchmüller <pullmoll@t-online.de>" maintainer="Jürgen Buchmüller <pullmoll@t-online.de>"
license="Apache-2.0" license="Apache-2.0"
@@ -16,8 +16,8 @@ distfiles="
https://github.com/tesseract-ocr/tesseract/archive/${version}.tar.gz>${pkgname}-${version}.tar.gz https://github.com/tesseract-ocr/tesseract/archive/${version}.tar.gz>${pkgname}-${version}.tar.gz
https://github.com/tesseract-ocr/tessdata/archive/${_tessdata_ver}.tar.gz>tessdata-${_tessdata_ver}.tar.gz" https://github.com/tesseract-ocr/tessdata/archive/${_tessdata_ver}.tar.gz>tessdata-${_tessdata_ver}.tar.gz"
checksum=" checksum="
57f63e1b14ae04c3932a2683e4be4954a2849e17edd638ffe91bc5a2156adc6a 3fe83e06d0f73b39f6e92ed9fc7ccba3ef734877b76aa5ddaaa778fac095d996
9da120aa47fc5f2780fb3bf6a346b502607e2b087d1f6857c6d55d5d003ec567" fd5cfdcada2a83aea8c855fbf916e1b34882659f796c10449c78d1385264d5a2"
# Create a package for one specific language $1 # Create a package for one specific language $1
pkg_lang() { pkg_lang() {
@@ -35,26 +35,23 @@ post_extract() {
} }
pre_configure() { pre_configure() {
cd ${wrksrc} cd ${wrksrc}
# Some include paths are not set in training/Makefile.am ? # Some include paths are not set in training/Makefile.am
sed -i training/Makefile.am \ # sed -i training/Makefile.am \
-e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/include/glib-2.0 \\\\" \ # -e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/include/glib-2.0 \\\\" \
-e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/lib/glib-2.0/include \\\\" \ # -e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/lib/glib-2.0/include \\\\" \
-e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/include/pango-1.0 \\\\" \ # -e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/include/pango-1.0 \\\\" \
-e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/include/cairo \\\\" \ # -e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/include/cairo \\\\" \
-e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/include/freetype2 \\\\" # -e "/AM_CPPFLAGS += \\\\/a -I${XBPS_CROSS_BASE}/usr/include/freetype2 \\\\"
./autogen.sh NOCONFIGURE=1 ./autogen.sh
case "$XBPS_TARGET_MACHINE" in }
*-musl) # Don't re-define off_t for musl libc post_build() {
sed -i ${wrksrc}/ccutil/scanutils.cpp \ make ${makejobs} training
-e "/typedef long off_t;/d"
esac
} }
post_install() { post_install() {
# Rename binary to avoid conflict with tesseract package # Rename binary to avoid conflict with tesseract package
mv ${DESTDIR}/usr/bin/tesseract{,-ocr} mv ${DESTDIR}/usr/bin/tesseract{,-ocr}
mv ${DESTDIR}/usr/share/man/man1/tesseract{,-ocr}.1 mv ${DESTDIR}/usr/share/man/man1/tesseract{,-ocr}.1
vdoc ChangeLog vdoc ChangeLog
vdoc ReleaseNotes
vdoc README.md vdoc README.md
vdoc testing/eurotext.tif vdoc testing/eurotext.tif
vdoc testing/phototest.tif vdoc testing/phototest.tif
@@ -65,33 +62,33 @@ tesseract-ocr-tools_package() {
short_desc+=" - Tools (development)" short_desc+=" - Tools (development)"
pkg_install() { pkg_install() {
local f local f
make -C training DESTDIR=${DESTDIR} install make DESTDIR=${PKGDESTDIR} training-install
vmkdir usr/share/tesseract # vmkdir usr/share/tesseract
vmkdir usr/share/man/man1 # vmkdir usr/share/man/man1
vmkdir usr/share/man/man5 # vmkdir usr/share/man/man5
# Copy shell scripts # # Copy shell scripts
for f in language-specific.sh tesstrain.sh tesstrain_utils.sh; do # for f in language-specific.sh tesstrain.sh tesstrain_utils.sh; do
if [ -e ${wrksrc}/training/${f} ]; then # if [ -e ${wrksrc}/training/${f} ]; then
cp -a ${wrksrc}/training/${f} \ # cp -a ${wrksrc}/training/${f} \
${PKGDESTDIR}/usr/share/tesseract # ${PKGDESTDIR}/usr/share/tesseract
fi # fi
done # done
# Move binaries and manual pages # # Move binaries and manual pages
for f in ambiguous_words classifier_tester cntraining combine_tessdata \ # for f in ambiguous_words classifier_tester cntraining combine_tessdata \
dawg2wordlist mftraining set_unicharset_properties \ # dawg2wordlist mftraining set_unicharset_properties \
shapeclustering text2image unicharambigs unicharset \ # shapeclustering text2image unicharambigs unicharset \
unicharset_extractor wordlist2dawg; do # unicharset_extractor wordlist2dawg; do
if [ -e ${DESTDIR}/usr/bin/${f} ]; then # if [ -e ${DESTDIR}/usr/bin/${f} ]; then
mv ${DESTDIR}/usr/bin/${f} \ # mv ${DESTDIR}/usr/bin/${f} \
${PKGDESTDIR}/usr/share/tesseract # ${PKGDESTDIR}/usr/share/tesseract
fi # fi
for n in 1 5; do # for n in 1 5; do
if [ -e ${DESTDIR}/usr/share/man/man${n}/${f}.${n} ]; then # if [ -e ${DESTDIR}/usr/share/man/man${n}/${f}.${n} ]; then
mv ${DESTDIR}/usr/share/man/man${n}/${f}.${n} \ # mv ${DESTDIR}/usr/share/man/man${n}/${f}.${n} \
${PKGDESTDIR}/usr/share/man/man${n} # ${PKGDESTDIR}/usr/share/man/man${n}
fi # fi
done # done
done # done
} }
} }
tesseract-ocr-devel_package() { tesseract-ocr-devel_package() {