Update to tesseract-5.1.0.

This commit is contained in:
ajacoutot 2022-04-18 15:31:43 +00:00
parent c580007bd1
commit c2c3f10d68
6 changed files with 10 additions and 19 deletions

View File

@@ -1,4 +1,4 @@
GH_TAGNAME ?= 4.1.1
GH_TAGNAME ?= 5.1.0
GH_ACCOUNT= tesseract-ocr
CATEGORIES += graphics textproc

View File

@@ -1,9 +1,8 @@
COMMENT= OCR Engine developed at HP Labs
GH_PROJECT= tesseract
REVISION= 1
SHARED_LIBS += tesseract 4.0
SHARED_LIBS += tesseract 4.1
WANTLIB += ${COMPILER_LIBCXX} X11 Xext Xrender archive b2 bz2
WANTLIB += c cairo charset crypto curl expat ffi fontconfig freetype
@@ -16,6 +15,8 @@ WANTLIB += xcb xcb-render xcb-shm z zstd Xau Xdmcp
# c++11: needed to build the training tools
COMPILER= base-clang ports-gcc
USE_GMAKE= Yes
LIB_DEPENDS= archivers/libarchive \
devel/pango \
graphics/leptonica \

View File

@@ -1,2 +1,2 @@
SHA256 (tesseract-4.1.1.tar.gz) = Kmb/DYWVv/jwQDIWXmyTY4mx5XJ8POWiez4FnSGNscs=
SIZE (tesseract-4.1.1.tar.gz) = 1974988
SHA256 (tesseract-5.1.0.tar.gz) = /eyFKNWg7MKKtf/5heC4ztYHJvbvM/VBJvKGjjI9S9I=
SIZE (tesseract-5.1.0.tar.gz) = 1910376

View File

@@ -3,7 +3,7 @@ No librt on OpenBSD.
Index: configure.ac
--- configure.ac.orig
+++ configure.ac
@@ -109,6 +109,9 @@ case "${host_os}" in
@@ -112,6 +112,9 @@ case "${host_os}" in
powerpc-*-darwin*)
OPENCL_LIBS=""
;;

View File

@@ -6,7 +6,6 @@
@bin bin/combine_lang_model
@bin bin/combine_tessdata
@bin bin/dawg2wordlist
bin/language-specific.sh
@bin bin/lstmeval
@bin bin/lstmtraining
@bin bin/merge_unicharsets
@@ -14,31 +13,22 @@ bin/language-specific.sh
@bin bin/set_unicharset_properties
@bin bin/shapeclustering
@bin bin/tesseract
bin/tesstrain.sh
bin/tesstrain_utils.sh
@bin bin/text2image
@bin bin/unicharset_extractor
@bin bin/wordlist2dawg
include/tesseract/
include/tesseract/apitypes.h
include/tesseract/baseapi.h
include/tesseract/capi.h
include/tesseract/genericvector.h
include/tesseract/helpers.h
include/tesseract/export.h
include/tesseract/ltrresultiterator.h
include/tesseract/ocrclass.h
include/tesseract/osdetect.h
include/tesseract/pageiterator.h
include/tesseract/platform.h
include/tesseract/publictypes.h
include/tesseract/renderer.h
include/tesseract/resultiterator.h
include/tesseract/serialis.h
include/tesseract/strngs.h
include/tesseract/tess_version.h
include/tesseract/tesscallback.h
include/tesseract/thresholder.h
include/tesseract/unichar.h
include/tesseract/version.h
@static-lib lib/libtesseract.a
lib/libtesseract.la
@lib lib/libtesseract.so.${LIBtesseract_VERSION}

View File

@@ -16,4 +16,4 @@ Here's a quick HOWTO about optical character recognition using:
$ scanimage --mode gray --resolution 300 > scan.pnm
$ unpaper -b 0.5 -w 0.8 -l single scan.pnm scan1.pnm
$ convert scan1.pnm scan.tif
$ tesseract scan.tif scan.txt
$ tesseract scan.tif scan