summaryrefslogtreecommitdiffstats
path: root/graphics/tesseract/tesseract.SlackBuild
diff options
context:
space:
mode:
Diffstat (limited to 'graphics/tesseract/tesseract.SlackBuild')
-rw-r--r--graphics/tesseract/tesseract.SlackBuild89
1 files changed, 75 insertions, 14 deletions
diff --git a/graphics/tesseract/tesseract.SlackBuild b/graphics/tesseract/tesseract.SlackBuild
index bfc36e41bd..63835762dd 100644
--- a/graphics/tesseract/tesseract.SlackBuild
+++ b/graphics/tesseract/tesseract.SlackBuild
@@ -1,14 +1,39 @@
#!/bin/sh
-# Pierre Cazenave revision date 10/11/2007
+# Pierre Cazenave 10/11/2007.
+# Updated 25/01/2009.
+# Updated 08/04/2009.
+# Updated 28/05/2009 for Slackware64.
# Modified by Robby Workman <rworkman@slackbuilds.org> for better
-# consistency with our other scripts
+# consistency with our other scripts
+# Thanks to S+*n_Pe*rm*n for a bug report from OCRopus.
+
+# Copyright 2009 Pierre Cazenave <pwcazenave {at} gmail [dot] com>
+# All rights reserved.
+#
+# Redistribution and use of this script, with or without modification, is
+# permitted provided that the following conditions are met:
+#
+# 1. Redistributions of this script must retain the above copyright
+# notice, this list of conditions and the following disclaimer.
+#
+# THIS SOFTWARE IS PROVIDED BY THE AUTHOR ''AS IS'' AND ANY EXPRESS OR IMPLIED
+# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
+# EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
+# OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
+# OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
+# ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
PRGNAM=tesseract
-VERSION=2.01
+VERSION=2.03
ARCH=${ARCH:-i486}
-BUILD=${BUILD:-2}
+BUILD=${BUILD:-5}
TAG=${TAG:-_SBo}
+
CWD=$(pwd)
TMP=${TMP:-/tmp/SBo}
PKG=$TMP/package-$PRGNAM
@@ -19,17 +44,22 @@ OUTPUT=${OUTPUT:-/tmp}
# of them on the command line (space delimited). If you pass more than one
# (again, space delimited), you must enclose the string in quotes. Examples:
# TESSLANG=fra ./tesseract.SlackBuild
-# TESSLANG="deu eng fra ita nld spa" ./tesseract.SlackBuild
+# TESSLANG="deu deu-f eng fra ita nld por spa vie" ./tesseract.SlackBuild
TESSLANG=${TESSLANG:-eng} # Default to English
if [ "$ARCH" = "i486" ]; then
SLKCFLAGS="-O2 -march=i486 -mtune=i686"
+ LIBDIRSUFFIX=""
elif [ "$ARCH" = "i686" ]; then
SLKCFLAGS="-O2 -march=i686 -mtune=i686"
+ LIBDIRSUFFIX=""
elif [ "$ARCH" = "x86_64" ]; then
SLKCFLAGS="-O2 -fPIC"
+ LIBDIRSUFFIX="64"
fi
+set -e
+
rm -rf $TMP/$PRGNAM-$VERSION $PKG
mkdir -p $TMP $PKG $OUTPUT
cd $TMP
@@ -38,9 +68,21 @@ cd $PRGNAM-$VERSION
chown -R root:root .
chmod -R u+w,go+r-w,a-s .
+# Patch the source with bug report from sister project OCRopus
+# http://ocropus.googlecode.com/svn/trunk/tesseract-2.03-patch.diff
+# Thanks to S+*n_Pe*rm*n for the bug report.
+patch -p1 < $CWD/patches/tesseract-2.03-patch.patch
+# Also patch for the java make install error.
+# http://tesseract-ocr.googlegroups.com/attach/cd42bea980dbe946/java
+# (renamed from java to tesseract-2.03-java.patch)
+patch -p1 < $CWD/patches/tesseract-2.03-java.patch
+# Fix up some missing includes needed for gcc in 13.0
+patch -p1 < $CWD/patches/tesseract-2.03-missing_includes.patch
+
CFLAGS="$SLKCFLAGS" \
./configure \
--prefix=/usr \
+ --libdir=/usr/lib${LIBDIRSUFFIX} \
--sysconfdir=/etc \
--localstatedir=/var \
--mandir=/usr/man \
@@ -48,16 +90,29 @@ CFLAGS="$SLKCFLAGS" \
make
-# Let's extract the desired language tarballs
+# Let's extract the desired language tarballs, with a hack for the different
+# version numbers for certain language files. I shied away from wildcards as
+# they're a bit unpredictable...
for _language in $(echo "$TESSLANG") ; do
- if [ -r $CWD/tesseract-2.00.$_language.tar.gz ]; then
- tar xf $CWD/tesseract-2.00.$_language.tar.gz
- SUCCESS=yes
+ if [ "$_language" == "deu-f" -o "$_language" == "por" -o "$_language" == "vie" ]; then
+ if [ -r $CWD/tesseract-2.01.$_language.tar.gz ]; then
+ tar xf $CWD/tesseract-2.01.$_language.tar.gz
+ SUCCESS=yes
+ else
+ echo "$CWD/tesseract-2.01.$_language.tar.gz not found."
+ sleep 5
+ fi;
else
- echo "$CWD/tesseract-2.00.$_language.tar.gz not found."
- sleep 5
- fi ;
+ if [ -r $CWD/tesseract-2.00.$_language.tar.gz ]; then
+ tar xf $CWD/tesseract-2.00.$_language.tar.gz
+ SUCCESS=yes
+ else
+ echo "$CWD/tesseract-2.00.$_language.tar.gz not found."
+ sleep 5
+ fi;
+ fi
done
+
if [ ! "$SUCCESS" = "yes" ]; then
echo "No language packs were found, so this package will not work as is."
echo "See $CWD/README for more information."
@@ -67,16 +122,22 @@ fi
make install DESTDIR=$PKG
( cd $PKG
- find . | xargs file | grep "executable" | grep ELF | cut -f 1 -d : | xargs strip --strip-unneeded 2> /dev/null
- find . | xargs file | grep "shared object" | grep ELF | cut -f 1 -d : | xargs strip --strip-unneeded 2> /dev/null
+ find . | xargs file | grep "executable" | grep ELF | cut -f 1 -d : | \
+ xargs strip --strip-unneeded 2> /dev/null || true
+ find . | xargs file | grep "shared object" | grep ELF | cut -f 1 -d : | \
+ xargs strip --strip-unneeded 2> /dev/null
)
mkdir -p $PKG/usr/doc/$PRGNAM-$VERSION
cp -a AUTHORS COPYING ChangeLog INSTALL NEWS README ReleaseNotes \
$PKG/usr/doc/$PRGNAM-$VERSION
cat $CWD/$PRGNAM.SlackBuild > $PKG/usr/doc/$PRGNAM-$VERSION/$PRGNAM.SlackBuild
+cat $CWD/README > $PKG/usr/doc/$PRGNAM-$VERSION/README$TAG
find $PKG/usr/doc/$PRGNAM-$VERSION -type f -exec chmod 644 {} \;
+# remove zero size files (from extra potentially not installed language packs).
+find $PKG/usr/share/tessdata -type f -size 0 -exec rm {} +
+
mkdir -p $PKG/install
cat $CWD/slack-desc > $PKG/install/slack-desc