diff options
Diffstat (limited to 'graphics/tesseract/tesseract.SlackBuild')
-rw-r--r-- | graphics/tesseract/tesseract.SlackBuild | 89 |
1 files changed, 75 insertions, 14 deletions
diff --git a/graphics/tesseract/tesseract.SlackBuild b/graphics/tesseract/tesseract.SlackBuild index bfc36e41bd..63835762dd 100644 --- a/graphics/tesseract/tesseract.SlackBuild +++ b/graphics/tesseract/tesseract.SlackBuild @@ -1,14 +1,39 @@ #!/bin/sh -# Pierre Cazenave revision date 10/11/2007 +# Pierre Cazenave 10/11/2007. +# Updated 25/01/2009. +# Updated 08/04/2009. +# Updated 28/05/2009 for Slackware64. # Modified by Robby Workman <rworkman@slackbuilds.org> for better -# consistency with our other scripts +# consistency with our other scripts +# Thanks to S+*n_Pe*rm*n for a bug report from OCRopus. + +# Copyright 2009 Pierre Cazenave <pwcazenave {at} gmail [dot] com> +# All rights reserved. +# +# Redistribution and use of this script, with or without modification, is +# permitted provided that the following conditions are met: +# +# 1. Redistributions of this script must retain the above copyright +# notice, this list of conditions and the following disclaimer. +# +# THIS SOFTWARE IS PROVIDED BY THE AUTHOR ''AS IS'' AND ANY EXPRESS OR IMPLIED +# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF +# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO +# EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, +# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, +# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; +# OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, +# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR +# OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF +# ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. PRGNAM=tesseract -VERSION=2.01 +VERSION=2.03 ARCH=${ARCH:-i486} -BUILD=${BUILD:-2} +BUILD=${BUILD:-5} TAG=${TAG:-_SBo} + CWD=$(pwd) TMP=${TMP:-/tmp/SBo} PKG=$TMP/package-$PRGNAM @@ -19,17 +44,22 @@ OUTPUT=${OUTPUT:-/tmp} # of them on the command line (space delimited). If you pass more than one # (again, space delimited), you must enclose the string in quotes. Examples: # TESSLANG=fra ./tesseract.SlackBuild -# TESSLANG="deu eng fra ita nld spa" ./tesseract.SlackBuild +# TESSLANG="deu deu-f eng fra ita nld por spa vie" ./tesseract.SlackBuild TESSLANG=${TESSLANG:-eng} # Default to English if [ "$ARCH" = "i486" ]; then SLKCFLAGS="-O2 -march=i486 -mtune=i686" + LIBDIRSUFFIX="" elif [ "$ARCH" = "i686" ]; then SLKCFLAGS="-O2 -march=i686 -mtune=i686" + LIBDIRSUFFIX="" elif [ "$ARCH" = "x86_64" ]; then SLKCFLAGS="-O2 -fPIC" + LIBDIRSUFFIX="64" fi +set -e + rm -rf $TMP/$PRGNAM-$VERSION $PKG mkdir -p $TMP $PKG $OUTPUT cd $TMP @@ -38,9 +68,21 @@ cd $PRGNAM-$VERSION chown -R root:root . chmod -R u+w,go+r-w,a-s . +# Patch the source with bug report from sister project OCRopus +# http://ocropus.googlecode.com/svn/trunk/tesseract-2.03-patch.diff +# Thanks to S+*n_Pe*rm*n for the bug report. +patch -p1 < $CWD/patches/tesseract-2.03-patch.patch +# Also patch for the java make install error. +# http://tesseract-ocr.googlegroups.com/attach/cd42bea980dbe946/java +# (renamed from java to tesseract-2.03-java.patch) +patch -p1 < $CWD/patches/tesseract-2.03-java.patch +# Fix up some missing includes needed for gcc in 13.0 +patch -p1 < $CWD/patches/tesseract-2.03-missing_includes.patch + CFLAGS="$SLKCFLAGS" \ ./configure \ --prefix=/usr \ + --libdir=/usr/lib${LIBDIRSUFFIX} \ --sysconfdir=/etc \ --localstatedir=/var \ --mandir=/usr/man \ @@ -48,16 +90,29 @@ CFLAGS="$SLKCFLAGS" \ make -# Let's extract the desired language tarballs +# Let's extract the desired language tarballs, with a hack for the different +# version numbers for certain language files. I shied away from wildcards as +# they're a bit unpredictable... for _language in $(echo "$TESSLANG") ; do - if [ -r $CWD/tesseract-2.00.$_language.tar.gz ]; then - tar xf $CWD/tesseract-2.00.$_language.tar.gz - SUCCESS=yes + if [ "$_language" == "deu-f" -o "$_language" == "por" -o "$_language" == "vie" ]; then + if [ -r $CWD/tesseract-2.01.$_language.tar.gz ]; then + tar xf $CWD/tesseract-2.01.$_language.tar.gz + SUCCESS=yes + else + echo "$CWD/tesseract-2.01.$_language.tar.gz not found." + sleep 5 + fi; else - echo "$CWD/tesseract-2.00.$_language.tar.gz not found." - sleep 5 - fi ; + if [ -r $CWD/tesseract-2.00.$_language.tar.gz ]; then + tar xf $CWD/tesseract-2.00.$_language.tar.gz + SUCCESS=yes + else + echo "$CWD/tesseract-2.00.$_language.tar.gz not found." + sleep 5 + fi; + fi done + if [ ! "$SUCCESS" = "yes" ]; then echo "No language packs were found, so this package will not work as is." echo "See $CWD/README for more information." @@ -67,16 +122,22 @@ fi make install DESTDIR=$PKG ( cd $PKG - find . | xargs file | grep "executable" | grep ELF | cut -f 1 -d : | xargs strip --strip-unneeded 2> /dev/null - find . | xargs file | grep "shared object" | grep ELF | cut -f 1 -d : | xargs strip --strip-unneeded 2> /dev/null + find . | xargs file | grep "executable" | grep ELF | cut -f 1 -d : | \ + xargs strip --strip-unneeded 2> /dev/null || true + find . | xargs file | grep "shared object" | grep ELF | cut -f 1 -d : | \ + xargs strip --strip-unneeded 2> /dev/null ) mkdir -p $PKG/usr/doc/$PRGNAM-$VERSION cp -a AUTHORS COPYING ChangeLog INSTALL NEWS README ReleaseNotes \ $PKG/usr/doc/$PRGNAM-$VERSION cat $CWD/$PRGNAM.SlackBuild > $PKG/usr/doc/$PRGNAM-$VERSION/$PRGNAM.SlackBuild +cat $CWD/README > $PKG/usr/doc/$PRGNAM-$VERSION/README$TAG find $PKG/usr/doc/$PRGNAM-$VERSION -type f -exec chmod 644 {} \; +# remove zero size files (from extra potentially not installed language packs). +find $PKG/usr/share/tessdata -type f -size 0 -exec rm {} + + mkdir -p $PKG/install cat $CWD/slack-desc > $PKG/install/slack-desc |