aboutsummaryrefslogtreecommitdiffstats
path: root/community/tesseract-ocr/APKBUILD
diff options
context:
space:
mode:
Diffstat (limited to 'community/tesseract-ocr/APKBUILD')
-rw-r--r--community/tesseract-ocr/APKBUILD134
1 files changed, 104 insertions, 30 deletions
diff --git a/community/tesseract-ocr/APKBUILD b/community/tesseract-ocr/APKBUILD
index 39c8fd497a5..0c4e18ec104 100644
--- a/community/tesseract-ocr/APKBUILD
+++ b/community/tesseract-ocr/APKBUILD
@@ -1,34 +1,107 @@
-# Contributor: Carlo Landmeter <clandmeter@gmail.com>
+# Contributor: Carlo Landmeter <clandmeter@alpinelinux.org>
# Maintainer: Francesco Colista <fcolista@alpinelinux.org>
pkgname=tesseract-ocr
-pkgver=4.1.1
-_tdver=4.0.0
-pkgrel=3
+pkgver=5.3.4
+_tdver=4.1.0
+pkgrel=0
pkgdesc="open source OCR engine"
url="https://github.com/tesseract-ocr/tesseract/releases"
-arch="all"
-license="Apache"
-makedepends="automake autoconf libtool leptonica-dev pango-dev icu-dev
- cairo-dev"
+# gigantic package that will most likely never be used here
+arch="all !s390x !armhf !x86 !ppc64le"
+license="Apache-2.0"
+makedepends="
+ autoconf
+ automake
+ cairo-dev
+ icu-dev
+ leptonica-dev
+ libtool
+ opencl-dev
+ pango-dev
+ "
subpackages="$pkgname-dev"
source="$pkgname-$pkgver.tar.gz::https://github.com/tesseract-ocr/tesseract/archive/$pkgver.tar.gz
- https://github.com/tesseract-ocr/tessdata/archive/${_tdver}/tessdata-${_tdver}.tar.gz
- include-time-h.patch
+ https://github.com/tesseract-ocr/tessdata/archive/$_tdver/tessdata-$_tdver.tar.gz
+ "
+builddir="$srcdir"/tesseract-$pkgver
+options="!check" # todo
+
+_langs="
+ afr
+ ara
+ aze
+ bel
+ ben
+ bul
+ cat
+ ces
+ chi_sim
+ chi_tra
+ chr
+ dan
+ deu
+ eng
+ enm
+ epo
+ equ
+ est
+ eus
+ fin
+ fra
+ frk
+ frm
+ glg
+ grc
+ heb
+ hin
+ hrv
+ hun
+ ind
+ isl
+ ita
+ ita_old
+ jpn
+ kan
+ kat
+ khm
+ kor
+ lav
+ lit
+ mal
+ mkd
+ mlt
+ msa
+ nld
+ nor
+ osd
+ pol
+ por
+ ron
+ rus
+ slk
+ slv
+ spa
+ spa_old
+ sqi
+ srp
+ swa
+ swe
+ tam
+ tel
+ tgl
+ tha
+ tur
+ ukr
+ vie
"
-_langs="afr ara aze bel ben bul cat ces chi_sim chi_tra chr dan deu ell
-enm epo equ est eus fin fra frk frm glg grc heb hin hrv hun ind isl ita
-ita_old jpn kan kor lav lit mal mkd mlt msa nld nor pol por ron rus slk
-slv spa spa_old sqi srp swa swe tam tel tgl tha tur ukr vie"
for _lang in $_langs; do
subpackages="$subpackages $pkgname-data-$_lang:_lang_data:noarch"
done
-builddir="$srcdir"/${pkgname/-*}-$pkgver
-
prepare() {
default_prepare
- ./autogen.sh
+ GIT_DIR=. ./autogen.sh
}
build() {
@@ -40,7 +113,8 @@ build() {
--mandir=/usr/share/man \
--infodir=/usr/share/info \
--localstatedir=/var \
- --disable-static
+ --disable-static \
+ --enable-opencl
make
make training
}
@@ -48,21 +122,21 @@ build() {
package() {
make DESTDIR="$pkgdir" install
make DESTDIR="$pkgdir" training-install
- install -D "$srcdir"/tessdata-$_tdver/eng.* \
- "$srcdir"/tessdata-$_tdver/osd.* \
- "$srcdir"/tessdata-$_tdver/equ.* \
- "$pkgdir"/usr/share/tessdata/
+ local lang
+ for lang in $_langs; do
+ install -Dm644 -t "$pkgdir"/usr/share/tessdata \
+ "$srcdir"/tessdata-$_tdver/$lang.traineddata
+ done
}
_lang_data() {
- local lang="${subpkgname#$pkgname-data-}"
+ local lang=${subpkgname#"$pkgname"-data-}
pkgdesc="Tesseract language data for $lang"
- depends="$pkgname"
- mkdir -p "$subpkgdir"/usr/share/tessdata
- mv "$srcdir"/tessdata-$_tdver/$lang.* \
- "$subpkgdir"/usr/share/tessdata/
+ depends="$pkgname=$pkgver-r$pkgrel"
+ amove usr/share/tessdata/$lang.*
}
-sha512sums="017723a2268be789fe98978eed02fd294968cc8050dde376dee026f56f2b99df42db935049ae5e72c4519a920e263b40af1a6a40d9942e66608145b3131a71a2 tesseract-ocr-4.1.1.tar.gz
-cd71bb99d44eefb53b359ba64b472c509fff773b2737a8d51e10d5d52d9a3a7ff870d470b1c72a7c78be3263b5ecfbb58a6eab13cf7128d8599681676cdcef6b tessdata-4.0.0.tar.gz
-3cc100bfa4eccac4123311c90626e747576b9d4b8b998f5e12bf6b2b9b0ffd8d9ea0160d11747e09d00283c4f782147c9b97c7b5c31679fb44784c2314de3cab include-time-h.patch"
+sha512sums="
+a81c98c3754a71093df7b51390ccd43d05f661352b4cb564e403b96d81909664c2ecbf2eb6f37614c4639e6dadbf2329b926d09271dbbdaa302f2d7b6b0d628a tesseract-ocr-5.3.4.tar.gz
+c0b55fb5542d25ebd4b56d25155cc8254027c9503af298641686388886403ee26ebf9ef47d21d530d372deeba6a01f6eb17705e1ab46bb02f9f7bf4f63805cd0 tessdata-4.1.0.tar.gz
+"