gnu: tesseract-ocr: Update to 4.1.1-1.97079fa

* gnu/packages/ocr.scm (tesseract-ocr): Update to 4.1.1-1.97079fa

Signed-off-by: Jelle Licht <jlicht@fsfe.org>
This commit is contained in:
andy Tai 2021-02-09 23:44:06 -08:00 committed by Jelle Licht
parent c63db58827
commit 822cd628e6
No known key found for this signature in database
GPG key ID: DA4597F947B41025

View file

@ -3,6 +3,7 @@
;;; Copyright © 2016, 2020 Efraim Flashner <efraim@flashner.co.il>
;;; Copyright © 2019 Tobias Geerinckx-Rice <me@tobias.gr>
;;; Copyright © 2019 Alex Vong <alexvong1995@gmail.com>
;;; Copyright © 2021 Andy Tai <atai@atai.org>
;;;
;;; This file is part of GNU Guix.
;;;
@ -26,8 +27,19 @@ (define-module (gnu packages ocr)
#:use-module (guix git-download)
#:use-module (guix build-system gnu)
#:use-module (guix build-system python)
#:use-module (gnu packages)
#:use-module (gnu packages autotools)
#:use-module (gnu packages backup)
#:use-module (gnu packages check)
#:use-module (gnu packages compression)
#:use-module (gnu packages curl)
#:use-module (gnu packages docbook)
#:use-module (gnu packages documentation)
#:use-module (gnu packages gtk)
#:use-module (gnu packages icu4c)
#:use-module (gnu packages pkg-config)
#:use-module (gnu packages python)
#:use-module (gnu packages xml)
#:use-module (gnu packages image))
(define-public ocrad
@ -52,25 +64,62 @@ (define-public ocrad
(license license:gpl3+)))
(define-public tesseract-ocr
;; There are useful commits beyond the last official stable release.
(let ((commit "97079fa353557af6df86fd20b5d2e0dff5d8d5df")
(revision "1"))
(package
(name "tesseract-ocr")
(version "3.04.01")
(version (git-version "4.1.1" revision commit))
(source
(origin
(method git-fetch)
(uri (git-reference
(url "https://github.com/tesseract-ocr/tesseract")
(commit version)))
(commit commit)))
(file-name (git-file-name name version))
(sha256
(base32 "0h1x4z1h86n2gwknd0wck6gykkp99bmm02lg4a47a698g4az6ybv"))))
(base32
"11137a4aaay7qp64vdjd83hz1l089nzi5a0ql0qgk8gn79pyhi98"))))
(build-system gnu-build-system)
(inputs
`(("leptonica" ,leptonica)))
`(("cairo" ,cairo)
("icu" ,icu4c)
("leptonica" ,leptonica)
("pango" ,pango)
("python-wrapper" ,python-wrapper)))
(native-inputs
`(("asciidoc" ,asciidoc)
("autoconf" ,autoconf)
("automake" ,automake)
("docbook-xsl" ,docbook-xsl)
("libarchive" ,libarchive)
("libcurl" ,curl)
("libtool" ,libtool)
("libtiff" ,libtiff)
("pkg-config" ,pkg-config)
("xsltproc" ,libxslt)))
(arguments
'(#:configure-flags
`(#:configure-flags
(let ((leptonica (assoc-ref %build-inputs "leptonica")))
(list (string-append "LIBLEPT_HEADERSDIR=" leptonica "/include")))))
(list (string-append "LIBLEPT_HEADERSDIR=" leptonica "/include")))
#:tests? #f ; Tests currently result in a segfault
#:phases
(modify-phases %standard-phases
(add-after 'unpack 'fix-docbook
(lambda* (#:key inputs #:allow-other-keys)
;; Don't attempt to download XSL schema.
(substitute* "doc/Makefile.am"
(("http://docbook.sourceforge.net/release/xsl/current/manpages/docbook.xsl")
(string-append (assoc-ref inputs "docbook-xsl")
"/xml/xsl/docbook-xsl-"
,(package-version docbook-xsl)
"/manpages/docbook.xsl")))))
(add-after 'install 'build-training
(lambda _
(invoke "make" "training")))
(add-after 'build-training 'install-training
(lambda _
(invoke "make" "training-install"))))))
(home-page "https://github.com/tesseract-ocr/tesseract")
(synopsis "Optical character recognition engine")
(description
@ -79,7 +128,7 @@ (define-public tesseract-ocr
positional information and page layout analysis. Several image formats are
supported through the Leptonica library. It can also detect whether text is
monospaced or proportional.")
(license license:asl2.0)))
(license license:asl2.0))))
(define-public zinnia
(let* ((commit "581faa8f6f15e4a7b21964be3a5ec36265c80e5b")
@ -151,3 +200,4 @@ (define-public python2-zinnia
#t)))))
(inputs
`(("zinnia" ,zinnia)))))