;;; GNU Guix --- Functional package management for GNU
;;; Copyright © 2013 Ludovic Courtès <ludo@gnu.org>
;;; Copyright © 2016, 2020 Efraim Flashner <efraim@flashner.co.il>
;;; Copyright © 2019 Tobias Geerinckx-Rice <me@tobias.gr>
;;; Copyright © 2019 Alex Vong <alexvong1995@gmail.com>
;;; Copyright © 2021 Andy Tai <atai@atai.org>
;;; Copyright © 2021, 2022 Nicolas Goaziou <mail@nicolasgoaziou.fr>
;;;
;;; This file is part of GNU Guix.
;;;
;;; GNU Guix is free software; you can redistribute it and/or modify it
;;; under the terms of the GNU General Public License as published by
;;; the Free Software Foundation; either version 3 of the License, or (at
;;; your option) any later version.
;;;
;;; GNU Guix is distributed in the hope that it will be useful, but
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
;;; GNU General Public License for more details.
;;;
;;; You should have received a copy of the GNU General Public License
;;; along with GNU Guix.  If not, see <http://www.gnu.org/licenses/>.

;; Module declaration for (gnu packages ocr).  The (guix licenses) bindings
;; are imported under the 'license:' prefix; every other module is imported
;; unprefixed.
(define-module (gnu packages ocr)
  #:use-module ((guix licenses) #:prefix license:)
  #:use-module (guix packages)
  #:use-module (guix download)
  #:use-module (guix gexp)
  #:use-module (guix git-download)
  #:use-module (guix build-system cmake)
  #:use-module (guix build-system gnu)
  #:use-module (guix build-system python)
  #:use-module (gnu packages)
  #:use-module (gnu packages autotools)
  #:use-module (gnu packages backup)
  #:use-module (gnu packages check)
  #:use-module (gnu packages compression)
  #:use-module (gnu packages curl)
  #:use-module (gnu packages djvu)
  #:use-module (gnu packages docbook)
  #:use-module (gnu packages documentation)
  #:use-module (gnu packages enchant)
  #:use-module (gnu packages gettext)
  #:use-module (gnu packages glib)
  #:use-module (gnu packages gtk)
  #:use-module (gnu packages icu4c)
  #:use-module (gnu packages pdf)
  #:use-module (gnu packages pkg-config)
  #:use-module (gnu packages python)
  #:use-module (gnu packages qt)
  #:use-module (gnu packages scanner)
  #:use-module (gnu packages xml)
  #:use-module (gnu packages image))

;; GNU Ocrad 0.27, fetched as a '.tar.lz' release tarball from the GNU
;; mirrors and built with the GNU build system.
(define-public ocrad
  (package
    (name "ocrad")
    (version "0.27")
    (source (origin
              (method url-fetch)
              (uri (string-append "mirror://gnu/ocrad/ocrad-"
                                  version ".tar.lz"))
              (sha256
               (base32
                "0divffvcaim89g4pvqs8kslbcxi475bcl3b4ynphf284k9zfdgx9"))))
    (build-system gnu-build-system)
    ;; Presumably needed to unpack the lzip-compressed source tarball.
    (native-inputs (list lzip))
    (home-page "https://www.gnu.org/software/ocrad/")
    (synopsis "Optical character recognition based on feature extraction")
    ;; Sentences are separated by two spaces, as 'guix lint' expects.
    (description
     "GNU Ocrad is an optical character recognition program based on a
feature extraction method.  It can read images in PBM, PGM or PPM formats and
it produces text in 8-bit or UTF-8 formats.")
    (license license:gpl3+)))

;; Tesseract OCR engine, built from a pinned Git commit with the GNU build
;; system.  After the regular install, the training tools are built and
;; installed by two extra phases.
(define-public tesseract-ocr
  ;; There are useful commits beyond the last official stable release.
  (let ((commit "97079fa353557af6df86fd20b5d2e0dff5d8d5df")
        (revision "1"))
    (package
      (name "tesseract-ocr")
      (version (git-version "4.1.1" revision commit))
      (source
       (origin
         (method git-fetch)
         (uri (git-reference
               (url "https://github.com/tesseract-ocr/tesseract")
               (commit commit)))
         (file-name (git-file-name name version))
         (sha256
          (base32
           "11137a4aaay7qp64vdjd83hz1l089nzi5a0ql0qgk8gn79pyhi98"))))
      (build-system gnu-build-system)
      ;; Inputs use the label-free '(list ...)' style like the other packages
      ;; in this file.  The implicit labels are the package names, so the
      ;; "leptonica" and "docbook-xsl" lookups in 'arguments' still resolve.
      (inputs
       (list cairo
             icu4c
             leptonica
             pango
             python-wrapper))
      (native-inputs
       (list asciidoc
             autoconf
             automake
             docbook-xsl
             libarchive
             curl
             libtool
             libtiff
             pkg-config
             libxslt))
      (arguments
       `(#:configure-flags
         ;; Tell 'configure' where the Leptonica headers are.
         (let ((leptonica (assoc-ref %build-inputs "leptonica")))
           (list (string-append "LIBLEPT_HEADERSDIR=" leptonica "/include")))
         #:tests? #f                    ; Tests currently result in a segfault
         #:phases
         (modify-phases %standard-phases
           (add-after 'unpack 'fix-docbook
             (lambda* (#:key inputs #:allow-other-keys)
               ;; Don't attempt to download XSL schema.  Point the man page
               ;; build at the stylesheet shipped by the 'docbook-xsl' input.
               (substitute* "doc/Makefile.am"
                 (("http://docbook.sourceforge.net/release/xsl/current/manpages/docbook.xsl")
                  (string-append (assoc-ref inputs "docbook-xsl")
                                 "/xml/xsl/docbook-xsl-"
                                 ,(package-version docbook-xsl)
                                 "/manpages/docbook.xsl")))))
           ;; The training tools are separate make targets, run after the
           ;; main 'install' phase.
           (add-after 'install 'build-training
             (lambda _
               (invoke "make" "training")))
           (add-after 'build-training 'install-training
             (lambda _
               (invoke "make" "training-install"))))))
      (home-page "https://github.com/tesseract-ocr/tesseract")
      (synopsis "Optical character recognition engine")
      ;; Sentences are separated by two spaces, as 'guix lint' expects.
      (description
       "Tesseract is an optical character recognition (OCR) engine with very
high accuracy.  It supports many languages, output text formatting, hOCR
positional information and page layout analysis.  Several image formats are
supported through the Leptonica library.  It can also detect whether text is
monospaced or proportional.")
      (license license:asl2.0))))

;; gImageReader 3.4.0, a Qt front-end to Tesseract, fetched as a release
;; tarball and built with CMake.
(define-public gimagereader
  (package
    (name "gimagereader")
    (version "3.4.0")
    (source
     (origin
       (method url-fetch)
       (uri (string-append
             "https://github.com/manisandro/gImageReader/releases"
             "/download/v" version "/"
             "gimagereader-" version ".tar.xz"))
       (sha256
        (base32 "09glxh7b4ivrd4samm67b8k2p0aljiagr83wb8nvy5ps2a9gwp5m"))))
    (build-system cmake-build-system)
    (arguments
     (list
      #:tests? #f                       ;no test
      ;; Passed verbatim to CMake; switches off ENABLE_VERSIONCHECK.
      #:configure-flags #~(list "-DENABLE_VERSIONCHECK=0")))
    (native-inputs
     (list gettext-minimal intltool pkg-config))
    (inputs
     (list enchant
           djvulibre
           leptonica
           podofo
           poppler-qt5
           sane-backends
           qtbase-5
           qtspell
           quazip-0
           tesseract-ocr))
    (home-page "https://github.com/manisandro/gImageReader")
    (synopsis "Qt front-end to tesseract-ocr")
    ;; Sentences are separated by two spaces, as 'guix lint' expects.  The
    ;; empty line inside the string is a deliberate paragraph break.
    (description
     "gImageReader is a Qt front-end to Tesseract optical character
recognition (OCR) software.

gImageReader supports automatic page layout detection but the user can
also manually define and adjust the recognition regions.  It is
possible to import images from disk, scanning devices, clipboard and
screenshots.  gImageReader also supports multipage PDF documents.
Recognized text is displayed directly next to the image and basic text
editing including search/replace and removing of line breaks is
possible.  Spellchecking for the output text is also supported if the
corresponding dictionaries are installed.")
    (license license:gpl3+)))

;; Zinnia handwriting recognition library, built from a pinned Git commit.
;; The origin snippet keeps only the "zinnia" sub-directory of the checkout,
;; and the build then runs from inside that directory.
(define-public zinnia
  (let* ((commit "581faa8f6f15e4a7b21964be3a5ec36265c80e5b")
         (revision "1")
         ;; version copied from 'configure.in'
         (version (git-version "0.07" revision commit)))
    (package
      (name "zinnia")
      (version version)
      (source
       (origin
         (method git-fetch)
         (uri (git-reference
               (url "https://github.com/taku910/zinnia")
               (commit commit)))
         (sha256
          (base32
           "1izjy5qw6swg0rs2ym2i72zndb90mwrfbd1iv8xbpwckbm4899lg"))
         (file-name (git-file-name name version))
         (modules '((guix build utils)
                    (ice-9 ftw)
                    (srfi srfi-26)))
         ;; Delete every top-level entry other than "zinnia" ("." and ".."
         ;; are skipped so the directory itself is left alone).  The snippet
         ;; is kept exactly as it was so the origin is not altered.
         (snippet ; remove unnecessary files with potentially different license
          '(begin
             (for-each delete-file-recursively
                       (scandir "."
                                (negate (cut member <> '("zinnia"
                                                         "." "..")))))
             #t))))
      (build-system gnu-build-system)
      (arguments
       `(#:phases
         (modify-phases %standard-phases
           ;; Instead of regenerating the build system, enter the "zinnia"
           ;; sub-directory and make the checked-in 'config.log' and
           ;; 'config.status' writable.  No trailing #t: phase return values
           ;; are ignored by the Guix this file already targets (it uses
           ;; gexp arguments and label-free inputs).
           (replace 'bootstrap
             (lambda _
               (chdir "zinnia")
               (for-each make-file-writable
                         '("config.log" "config.status")))))))
      (home-page "https://taku910.github.io/zinnia/")
      (synopsis "Online hand recognition system with machine learning")
      ;; Sentences are separated by two spaces, as 'guix lint' expects.
      (description
       "Zinnia is a simple, customizable and portable online hand recognition
system based on Support Vector Machines.  Zinnia simply receives user pen
strokes as a sequence of coordinate data and outputs n-best characters sorted
by SVM confidence.  To keep portability, Zinnia doesn't have any rendering
functionality.  In addition to recognition, Zinnia provides training module
that allows us to create any hand-written recognition systems with low-cost.")
      (license (list license:bsd-3 ; all files except...
                     (license:non-copyleft ; some autotools related files
                      "file://zinnia/aclocal.m4")
                     license:x11 ; 'install-sh'
                     license:public-domain))))) ; 'install-sh'

;;; Python 2 bindings, licensed under the same terms as zinnia.
;; Python 2 bindings for Zinnia.  All fields not overridden here (source,
;; version, home page, synopsis, description, license) are inherited from
;; the 'zinnia' package, which is also the sole input.
(define-public python2-zinnia
  (package
    (inherit zinnia)
    (name "python2-zinnia")
    (build-system python-build-system)
    (arguments
     `(#:python ,python-2 ; CObject API is used, it was removed in Python 3.2
       #:tests? #f ; avoid circular dependency on tegaki-zinnia-japanese
       #:phases
       (modify-phases %standard-phases
         ;; Build from the "zinnia/python" sub-directory of the source tree.
         ;; No trailing #t: phase return values are ignored by the Guix this
         ;; file already targets.
         (add-after 'unpack 'chdir
           (lambda _
             (chdir "zinnia/python"))))))
    (inputs
     (list zinnia))))