mirror of
https://git.in.rschanz.org/ryan77627/guix.git
synced 2024-12-27 23:02:16 -05:00
gnu: tesseract-ocr: Update to 4.1.1-1.97079fa
* gnu/packages/ocr.scm (tesseract-ocr): Update to 4.1.1-1.97079fa Signed-off-by: Jelle Licht <jlicht@fsfe.org>
This commit is contained in:
parent
c63db58827
commit
822cd628e6
1 changed files with 74 additions and 24 deletions
|
@ -3,6 +3,7 @@
|
|||
;;; Copyright © 2016, 2020 Efraim Flashner <efraim@flashner.co.il>
|
||||
;;; Copyright © 2019 Tobias Geerinckx-Rice <me@tobias.gr>
|
||||
;;; Copyright © 2019 Alex Vong <alexvong1995@gmail.com>
|
||||
;;; Copyright © 2021 Andy Tai <atai@atai.org>
|
||||
;;;
|
||||
;;; This file is part of GNU Guix.
|
||||
;;;
|
||||
|
@ -26,8 +27,19 @@ (define-module (gnu packages ocr)
|
|||
#:use-module (guix git-download)
|
||||
#:use-module (guix build-system gnu)
|
||||
#:use-module (guix build-system python)
|
||||
#:use-module (gnu packages)
|
||||
#:use-module (gnu packages autotools)
|
||||
#:use-module (gnu packages backup)
|
||||
#:use-module (gnu packages check)
|
||||
#:use-module (gnu packages compression)
|
||||
#:use-module (gnu packages curl)
|
||||
#:use-module (gnu packages docbook)
|
||||
#:use-module (gnu packages documentation)
|
||||
#:use-module (gnu packages gtk)
|
||||
#:use-module (gnu packages icu4c)
|
||||
#:use-module (gnu packages pkg-config)
|
||||
#:use-module (gnu packages python)
|
||||
#:use-module (gnu packages xml)
|
||||
#:use-module (gnu packages image))
|
||||
|
||||
(define-public ocrad
|
||||
|
@ -52,34 +64,71 @@ (define-public ocrad
|
|||
(license license:gpl3+)))
|
||||
|
||||
(define-public tesseract-ocr
|
||||
(package
|
||||
(name "tesseract-ocr")
|
||||
(version "3.04.01")
|
||||
(source
|
||||
(origin
|
||||
(method git-fetch)
|
||||
(uri (git-reference
|
||||
(url "https://github.com/tesseract-ocr/tesseract")
|
||||
(commit version)))
|
||||
(file-name (git-file-name name version))
|
||||
(sha256
|
||||
(base32 "0h1x4z1h86n2gwknd0wck6gykkp99bmm02lg4a47a698g4az6ybv"))))
|
||||
(build-system gnu-build-system)
|
||||
(inputs
|
||||
`(("leptonica" ,leptonica)))
|
||||
(arguments
|
||||
'(#:configure-flags
|
||||
(let ((leptonica (assoc-ref %build-inputs "leptonica")))
|
||||
(list (string-append "LIBLEPT_HEADERSDIR=" leptonica "/include")))))
|
||||
(home-page "https://github.com/tesseract-ocr/tesseract")
|
||||
(synopsis "Optical character recognition engine")
|
||||
(description
|
||||
"Tesseract is an optical character recognition (OCR) engine with very
|
||||
;; There are useful commits beyond the last official stable release.
|
||||
(let ((commit "97079fa353557af6df86fd20b5d2e0dff5d8d5df")
|
||||
(revision "1"))
|
||||
(package
|
||||
(name "tesseract-ocr")
|
||||
(version (git-version "4.1.1" revision commit))
|
||||
(source
|
||||
(origin
|
||||
(method git-fetch)
|
||||
(uri (git-reference
|
||||
(url "https://github.com/tesseract-ocr/tesseract")
|
||||
(commit commit)))
|
||||
(file-name (git-file-name name version))
|
||||
(sha256
|
||||
(base32
|
||||
"11137a4aaay7qp64vdjd83hz1l089nzi5a0ql0qgk8gn79pyhi98"))))
|
||||
(build-system gnu-build-system)
|
||||
(inputs
|
||||
`(("cairo" ,cairo)
|
||||
("icu" ,icu4c)
|
||||
("leptonica" ,leptonica)
|
||||
("pango" ,pango)
|
||||
("python-wrapper" ,python-wrapper)))
|
||||
(native-inputs
|
||||
`(("asciidoc" ,asciidoc)
|
||||
("autoconf" ,autoconf)
|
||||
("automake" ,automake)
|
||||
("docbook-xsl" ,docbook-xsl)
|
||||
("libarchive" ,libarchive)
|
||||
("libcurl" ,curl)
|
||||
("libtool" ,libtool)
|
||||
("libtiff" ,libtiff)
|
||||
("pkg-config" ,pkg-config)
|
||||
("xsltproc" ,libxslt)))
|
||||
(arguments
|
||||
`(#:configure-flags
|
||||
(let ((leptonica (assoc-ref %build-inputs "leptonica")))
|
||||
(list (string-append "LIBLEPT_HEADERSDIR=" leptonica "/include")))
|
||||
#:tests? #f ; Tests currently result in a segfault
|
||||
#:phases
|
||||
(modify-phases %standard-phases
|
||||
(add-after 'unpack 'fix-docbook
|
||||
(lambda* (#:key inputs #:allow-other-keys)
|
||||
;; Don't attempt to download XSL schema.
|
||||
(substitute* "doc/Makefile.am"
|
||||
(("http://docbook.sourceforge.net/release/xsl/current/manpages/docbook.xsl")
|
||||
(string-append (assoc-ref inputs "docbook-xsl")
|
||||
"/xml/xsl/docbook-xsl-"
|
||||
,(package-version docbook-xsl)
|
||||
"/manpages/docbook.xsl")))))
|
||||
(add-after 'install 'build-training
|
||||
(lambda _
|
||||
(invoke "make" "training")))
|
||||
(add-after 'build-training 'install-training
|
||||
(lambda _
|
||||
(invoke "make" "training-install"))))))
|
||||
(home-page "https://github.com/tesseract-ocr/tesseract")
|
||||
(synopsis "Optical character recognition engine")
|
||||
(description
|
||||
"Tesseract is an optical character recognition (OCR) engine with very
|
||||
high accuracy. It supports many languages, output text formatting, hOCR
|
||||
positional information and page layout analysis. Several image formats are
|
||||
supported through the Leptonica library. It can also detect whether text is
|
||||
monospaced or proportional.")
|
||||
(license license:asl2.0)))
|
||||
(license license:asl2.0))))
|
||||
|
||||
(define-public zinnia
|
||||
(let* ((commit "581faa8f6f15e4a7b21964be3a5ec36265c80e5b")
|
||||
|
@ -151,3 +200,4 @@ (define-public python2-zinnia
|
|||
#t)))))
|
||||
(inputs
|
||||
`(("zinnia" ,zinnia)))))
|
||||
|
||||
|
|
Loading…
Reference in a new issue