gnu: Add catdoc.

* gnu/packages/textutils.scm (catdoc): New variable.
This commit is contained in:
Hartmut Goebel 2017-05-15 11:41:54 +02:00
parent 1edbdb0bfc
commit d0abaf8960
No known key found for this signature in database
GPG key ID: 634A8DFFD3F631DF

View file

@ -10,6 +10,7 @@
;;; Copyright © 2016 Marius Bakke <mbakke@fastmail.com>
;;; Copyright © 2017 Eric Bavier <bavier@member.fsf.org>
;;; Copyright © 2017 Rene Saavedra <rennes@openmailbox.org>
;;; Copyright © 2017 Hartmut Goebel <h.goebel@crazy-compilers.com>
;;;
;;; This file is part of GNU Guix.
;;;
@ -368,6 +369,45 @@ (define-public antiword
runs Word\".")
(license license:gpl2+)))
(define-public catdoc
(package
(name "catdoc")
(version "0.95")
(source (origin
(method url-fetch)
(uri (string-append "http://ftp.wagner.pp.ru/pub/catdoc/"
"catdoc-" version ".tar.gz"))
(sha256
(base32
"15h7v3bmwfk4z8r78xs5ih6vd0pskn0rj90xghvbzdjj0cc88jji"))))
(build-system gnu-build-system)
;; TODO: Also build `wordview` which requires `tk` make a separate
;; package for this.
(arguments
'(#:tests? #f ; There are no tests
#:configure-flags '("--disable-wordview")
#:phases
(modify-phases %standard-phases
(add-before 'install 'fix-install
(lambda* (#:key outputs #:allow-other-keys)
(let ((out (assoc-ref outputs "out")))
(mkdir-p (string-append out "/share/man/man1"))))))))
(home-page "http://www.wagner.pp.ru/~vitus/software/catdoc/")
(synopsis "MS-Word to TeX or plain text converter")
(description "@command{catdoc} extracts text from MS-Word files, trying to
preserve as many special printable characters as possible. It supports
everything up to Word-97. Also supported are MS Write documents and RTF files.
@command{catdoc} does not preserve complex word formatting, but it can
translate some non-ASCII characters into TeX escape codes. It's goal is to
extract plain text and allow you to read it and, probably, reformat with TeX,
according to TeXnical rules.
This package also provides @command{xls2csv}, which extracts data from Excel
spreadsheets and outputs it in comma-separated-value format, and
@command{catppt}, which extracts data from PowerPoint presentations.")
(license license:gpl2+)))
(define-public utfcpp
(package
(name "utfcpp")