2015-03-04 16:34:13 -05:00
|
|
|
|
;;; GNU Guix --- Functional package management for GNU
|
|
|
|
|
;;; Copyright © 2015 Taylan Ulrich Bayırlı/Kammer <taylanbayirli@gmail.com>
|
2016-01-03 00:41:49 -05:00
|
|
|
|
;;; Copyright © 2015, 2016 Ricardo Wurmus <rekado@elephly.net>
|
2016-02-15 07:11:13 -05:00
|
|
|
|
;;; Copyright © 2015, 2016 Ben Woodcroft <donttrustben@gmail.com>
|
2015-12-10 10:15:04 -05:00
|
|
|
|
;;; Copyright © 2015 Roel Janssen <roel@gnu.org>
|
2016-03-26 13:28:31 -04:00
|
|
|
|
;;; Copyright © 2016 Jelle Licht <jlicht@fsfe.org>
|
2016-05-07 13:16:39 -04:00
|
|
|
|
;;; Copyright © 2016 Alex Griffin <a@ajgrf.com>
|
2016-05-30 02:35:10 -04:00
|
|
|
|
;;; Copyright © 2016 Efraim Flashner <efraim@flashner.co.il>
|
2016-10-16 19:00:28 -04:00
|
|
|
|
;;; Copyright © 2016 ng0 <ng0@we.make.ritual.n0.is>
|
2016-10-12 18:24:42 -04:00
|
|
|
|
;;; Copyright © 2016 Marius Bakke <mbakke@fastmail.com>
|
2017-02-11 00:18:49 -05:00
|
|
|
|
;;; Copyright © 2017 Eric Bavier <bavier@member.fsf.org>
|
2017-03-23 14:29:26 -04:00
|
|
|
|
;;; Copyright © 2017 Rene Saavedra <rennes@openmailbox.org>
|
2017-05-15 05:41:54 -04:00
|
|
|
|
;;; Copyright © 2017 Hartmut Goebel <h.goebel@crazy-compilers.com>
|
2015-03-04 16:34:13 -05:00
|
|
|
|
;;;
|
|
|
|
|
;;; This file is part of GNU Guix.
|
|
|
|
|
;;;
|
|
|
|
|
;;; GNU Guix is free software; you can redistribute it and/or modify it
|
|
|
|
|
;;; under the terms of the GNU General Public License as published by
|
|
|
|
|
;;; the Free Software Foundation; either version 3 of the License, or (at
|
|
|
|
|
;;; your option) any later version.
|
|
|
|
|
;;;
|
|
|
|
|
;;; GNU Guix is distributed in the hope that it will be useful, but
|
|
|
|
|
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
;;; GNU General Public License for more details.
|
|
|
|
|
;;;
|
|
|
|
|
;;; You should have received a copy of the GNU General Public License
|
|
|
|
|
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
|
|
(define-module (gnu packages textutils)
|
|
|
|
|
#:use-module ((guix licenses) #:prefix license:)
|
|
|
|
|
#:use-module (guix packages)
|
|
|
|
|
#:use-module (guix download)
|
|
|
|
|
#:use-module (guix git-download)
|
|
|
|
|
#:use-module (guix build-system gnu)
|
2016-01-03 00:41:49 -05:00
|
|
|
|
#:use-module (guix build-system cmake)
|
2016-05-07 13:16:39 -04:00
|
|
|
|
#:use-module (guix build-system trivial)
|
2016-05-30 02:35:10 -04:00
|
|
|
|
#:use-module (gnu packages)
|
2015-04-14 10:35:30 -04:00
|
|
|
|
#:use-module (gnu packages autotools)
|
2016-10-16 19:00:28 -04:00
|
|
|
|
#:use-module (gnu packages ncurses)
|
|
|
|
|
#:use-module (gnu packages perl)
|
|
|
|
|
#:use-module (gnu packages pkg-config)
|
2016-05-07 13:16:39 -04:00
|
|
|
|
#:use-module (gnu packages python)
|
2016-10-16 19:00:28 -04:00
|
|
|
|
#:use-module (gnu packages readline)
|
|
|
|
|
#:use-module (gnu packages slang)
|
2016-05-07 13:16:39 -04:00
|
|
|
|
#:use-module (gnu packages zip))
|
2015-03-04 16:34:13 -05:00
|
|
|
|
|
|
|
|
|
(define-public recode
|
|
|
|
|
(package
|
|
|
|
|
(name "recode")
|
|
|
|
|
;; Last beta release (3.7-beta2) is from 2008; last commit from Feb 2014.
|
|
|
|
|
;; So we use that commit instead.
|
|
|
|
|
(version "3.7.0.201402")
|
|
|
|
|
(source
|
|
|
|
|
(origin
|
|
|
|
|
(method git-fetch)
|
|
|
|
|
(uri (git-reference
|
|
|
|
|
(url "https://github.com/pinard/Recode.git")
|
|
|
|
|
(commit "2d7092a9999194fc0e9449717a8048c8d8e26c18")))
|
|
|
|
|
(sha256
|
2015-11-23 06:03:17 -05:00
|
|
|
|
(base32 "1wssv8z6g3ryrw33sksz4rjhlnhgvvdqszw1ggl4rcwks34n86zm"))
|
|
|
|
|
(file-name (string-append name "-" version "-checkout"))))
|
2015-03-04 16:34:13 -05:00
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(native-inputs `(("python" ,python-2)))
|
|
|
|
|
(arguments
|
|
|
|
|
'(#:phases
|
|
|
|
|
(alist-cons-before
|
2015-04-15 00:04:51 -04:00
|
|
|
|
'check 'pre-check
|
2015-03-04 16:34:13 -05:00
|
|
|
|
(lambda _
|
|
|
|
|
(substitute* "tests/setup.py"
|
|
|
|
|
(("([[:space:]]*)include_dirs=.*" all space)
|
2015-04-15 00:04:51 -04:00
|
|
|
|
(string-append all space "library_dirs=['../src/.libs'],\n")))
|
|
|
|
|
;; The test extension 'Recode.so' lacks RUNPATH for 'librecode.so'.
|
|
|
|
|
(setenv "LD_LIBRARY_PATH" (string-append (getcwd) "/src/.libs")))
|
2015-03-04 16:34:13 -05:00
|
|
|
|
%standard-phases)))
|
|
|
|
|
(home-page "https://github.com/pinard/Recode")
|
|
|
|
|
(synopsis "Text encoding converter")
|
|
|
|
|
(description "The Recode library converts files between character sets and
|
|
|
|
|
usages. It recognises or produces over 200 different character sets (or about
|
|
|
|
|
300 if combined with an iconv library) and transliterates files between almost
|
|
|
|
|
any pair. When exact transliteration are not possible, it gets rid of
|
|
|
|
|
offending characters or falls back on approximations. The recode program is a
|
|
|
|
|
handy front-end to the library.")
|
|
|
|
|
(license license:gpl2+)))
|
2015-03-04 16:35:15 -05:00
|
|
|
|
|
|
|
|
|
(define-public enca
|
|
|
|
|
(package
|
|
|
|
|
(name "enca")
|
|
|
|
|
(version "1.16")
|
|
|
|
|
(source
|
|
|
|
|
(origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append
|
|
|
|
|
"https://github.com/nijel/enca/archive/" version ".tar.gz"))
|
|
|
|
|
(sha256
|
2015-11-23 07:46:31 -05:00
|
|
|
|
(base32 "1xik00x0yvhswsw2isnclabhv536xk1s42cf5z54gfbpbhc7ni8l"))
|
|
|
|
|
(file-name (string-append name "-" version ".tar.gz"))))
|
2015-03-04 16:35:15 -05:00
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(inputs `(("recode" ,recode)))
|
2015-03-10 09:18:19 -04:00
|
|
|
|
|
|
|
|
|
;; Both 'test-convert-64.sh' and 'test-convert-filter.sh' manipulate a
|
|
|
|
|
;; 'test.tmp' file, so they have to run in sequence.
|
|
|
|
|
(arguments '(#:parallel-tests? #f))
|
|
|
|
|
|
2015-03-04 16:35:15 -05:00
|
|
|
|
(home-page "https://github.com/nijel/enca")
|
|
|
|
|
(synopsis "Text encoding detection tool")
|
|
|
|
|
(description "Enca (Extremely Naive Charset Analyser) consists of libenca,
|
|
|
|
|
an encoding detection library, and enca, a command line frontend, integrating
|
|
|
|
|
libenca and several charset conversion libraries and tools.")
|
|
|
|
|
(license license:gpl2)))
|
2015-03-19 12:06:06 -04:00
|
|
|
|
|
|
|
|
|
(define-public utf8proc
|
|
|
|
|
(package
|
|
|
|
|
(name "utf8proc")
|
2017-02-10 22:06:57 -05:00
|
|
|
|
(version "2.1.0")
|
2015-03-19 12:06:06 -04:00
|
|
|
|
(source
|
|
|
|
|
(origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append
|
|
|
|
|
"https://github.com/JuliaLang/utf8proc/archive/v"
|
|
|
|
|
version ".tar.gz"))
|
|
|
|
|
(file-name (string-append name "-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
2017-02-10 22:06:57 -05:00
|
|
|
|
(base32 "0q1jhdkk4f9b0zb8s2ql3sba3br5nvjsmbsaybmgj064k9hwbk15"))))
|
2015-03-19 12:06:06 -04:00
|
|
|
|
(build-system gnu-build-system)
|
2017-02-11 00:18:49 -05:00
|
|
|
|
(inputs ;test data that is otherwise downloaded with curl
|
|
|
|
|
`(("NormalizationTest.txt"
|
|
|
|
|
,(origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append "http://www.unicode.org/Public/9.0.0/ucd/"
|
|
|
|
|
"NormalizationTest.txt"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32 "1fxrz0bilsbwl685336aqi88k62i6nqhm62rvy4zhg3bcm4dhj1d"))))
|
|
|
|
|
("GraphemeBreakTest.txt"
|
|
|
|
|
,(origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append "http://www.unicode.org/Public/9.0.0/ucd/"
|
|
|
|
|
"auxiliary/GraphemeBreakTest.txt"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32 "0qbhyhmf0778lc2hcwlpizrvmdxwpk959v2q2wb8abv09ba7wvn7"))))))
|
2015-03-19 12:06:06 -04:00
|
|
|
|
(arguments
|
2017-02-11 00:18:49 -05:00
|
|
|
|
'(#:make-flags (list "CC=gcc"
|
2015-11-30 08:31:02 -05:00
|
|
|
|
(string-append "prefix=" (assoc-ref %outputs "out")))
|
2015-03-19 12:06:06 -04:00
|
|
|
|
#:phases
|
2015-11-30 08:31:02 -05:00
|
|
|
|
(modify-phases %standard-phases
|
2017-02-11 00:18:49 -05:00
|
|
|
|
(delete 'configure)
|
|
|
|
|
(add-before 'check 'check-data
|
|
|
|
|
(lambda* (#:key inputs #:allow-other-keys)
|
|
|
|
|
(for-each (lambda (i)
|
|
|
|
|
(copy-file (assoc-ref inputs i)
|
|
|
|
|
(string-append "data/" i)))
|
|
|
|
|
'("NormalizationTest.txt" "GraphemeBreakTest.txt"))
|
|
|
|
|
(substitute* "data/GraphemeBreakTest.txt"
|
|
|
|
|
(("÷") "/")
|
|
|
|
|
(("×") "+")))))))
|
2015-03-19 12:06:06 -04:00
|
|
|
|
(home-page "http://julialang.org/utf8proc/")
|
|
|
|
|
(synopsis "C library for processing UTF-8 Unicode data")
|
|
|
|
|
(description "utf8proc is a small C library that provides Unicode
|
|
|
|
|
normalization, case-folding, and other operations for data in the UTF-8
|
2016-09-25 05:00:05 -04:00
|
|
|
|
encoding, supporting Unicode version 9.0.0.")
|
2015-03-19 12:06:06 -04:00
|
|
|
|
(license license:expat)))
|
2015-04-14 10:35:30 -04:00
|
|
|
|
|
|
|
|
|
(define-public libgtextutils
|
|
|
|
|
(package
|
|
|
|
|
(name "libgtextutils")
|
|
|
|
|
(version "0.7")
|
|
|
|
|
(source
|
|
|
|
|
(origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append
|
|
|
|
|
"https://github.com/agordon/libgtextutils/releases/download/"
|
|
|
|
|
version "/libgtextutils-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32 "0jiybkb2z58wa2msvllnphr4js2hvjvh988pavb3mzkgr6ihwbkr"))))
|
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(arguments
|
|
|
|
|
'(#:phases
|
|
|
|
|
(alist-cons-after
|
|
|
|
|
'unpack 'autoreconf
|
|
|
|
|
(lambda _ (zero? (system* "autoreconf" "-vif")))
|
|
|
|
|
%standard-phases)))
|
|
|
|
|
(native-inputs
|
|
|
|
|
`(("autoconf" ,autoconf)
|
|
|
|
|
("automake" ,automake)
|
|
|
|
|
("libtool" ,libtool)))
|
|
|
|
|
(home-page "https://github.com/agordon/libgtextutils")
|
|
|
|
|
(synopsis "Gordon's text utils library")
|
|
|
|
|
(description
|
|
|
|
|
"libgtextutils is a text utilities library used by the fastx toolkit from
|
|
|
|
|
the Hannon Lab.")
|
|
|
|
|
(license license:agpl3+)))
|
2015-09-29 08:10:33 -04:00
|
|
|
|
|
|
|
|
|
(define-public cityhash
|
2016-02-15 07:11:13 -05:00
|
|
|
|
(let ((commit "8af9b8c"))
|
2015-09-29 08:10:33 -04:00
|
|
|
|
(package
|
|
|
|
|
(name "cityhash")
|
2016-02-15 07:11:13 -05:00
|
|
|
|
(version (string-append "1.1-2." commit))
|
2015-09-29 08:10:33 -04:00
|
|
|
|
(source (origin
|
|
|
|
|
(method git-fetch)
|
|
|
|
|
(uri (git-reference
|
|
|
|
|
(url "https://github.com/google/cityhash.git")
|
|
|
|
|
(commit commit)))
|
|
|
|
|
(file-name (string-append name "-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
|
|
|
|
"0n6skf5dv8yfl1ckax8dqhvsbslkwc9158zf2ims0xqdvzsahbi6"))))
|
2016-02-15 07:11:13 -05:00
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(arguments
|
|
|
|
|
'(#:make-flags (list "CXXFLAGS=-g -O3")
|
|
|
|
|
#:phases
|
|
|
|
|
(modify-phases %standard-phases
|
|
|
|
|
;; citycrc is not installed by default but is used by some
|
|
|
|
|
;; programs.
|
|
|
|
|
(add-after 'install 'install-citycrc
|
|
|
|
|
(lambda* (#:key outputs #:allow-other-keys)
|
|
|
|
|
(let* ((out (assoc-ref outputs "out"))
|
|
|
|
|
(include (string-append out "/include")))
|
|
|
|
|
(install-file "src/citycrc.h" include))
|
|
|
|
|
#t)))))
|
|
|
|
|
(home-page "https://github.com/google/cityhash")
|
|
|
|
|
(synopsis "C++ hash functions for strings")
|
|
|
|
|
(description
|
|
|
|
|
"CityHash provides hash functions for strings. The functions mix the
|
2015-09-29 08:10:33 -04:00
|
|
|
|
input bits thoroughly but are not suitable for cryptography.")
|
2016-02-15 07:11:13 -05:00
|
|
|
|
(license license:expat))))
|
2015-12-10 10:15:04 -05:00
|
|
|
|
|
2016-03-17 08:08:30 -04:00
|
|
|
|
(define-public ustr
|
|
|
|
|
(package
|
|
|
|
|
(name "ustr")
|
|
|
|
|
(version "1.0.4")
|
|
|
|
|
(source (origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append "http://www.and.org/ustr/" version
|
|
|
|
|
"/ustr-" version ".tar.bz2"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
2017-03-23 14:29:26 -04:00
|
|
|
|
"1i623ygdj7rkizj7985q9d6vj5amwg686aqb5j3ixpkqkyp6xbrx"))
|
|
|
|
|
(patches (search-patches "ustr-fix-build-with-gcc-5.patch"))))
|
2016-03-17 08:08:30 -04:00
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(arguments
|
|
|
|
|
`(#:make-flags
|
|
|
|
|
(list "CC=gcc"
|
|
|
|
|
"HIDE="
|
|
|
|
|
;; Override "/sbin/ldconfig" with "echo" because we don't need
|
|
|
|
|
;; "ldconfig".
|
|
|
|
|
"LDCONFIG=echo"
|
|
|
|
|
(string-append "prefix=" (assoc-ref %outputs "out"))
|
|
|
|
|
"all-shared")
|
|
|
|
|
#:phases
|
|
|
|
|
(modify-phases %standard-phases
|
|
|
|
|
(add-after 'unpack 'disable-check-for-stdint
|
|
|
|
|
(lambda _
|
|
|
|
|
;; Of course we have stdint.h, just not in /usr/include
|
|
|
|
|
(substitute* '("Makefile"
|
|
|
|
|
"ustr-import.in")
|
|
|
|
|
(("-f \"/usr/include/stdint.h\"") "-z \"\""))
|
|
|
|
|
#t))
|
|
|
|
|
;; No configure script
|
|
|
|
|
(delete 'configure))))
|
|
|
|
|
(home-page "http://www.and.org/ustr/")
|
|
|
|
|
(synopsis "String library with very low memory overhead")
|
|
|
|
|
(description
|
|
|
|
|
"Ustr is a string library for C with very low memory overhead.")
|
|
|
|
|
;; Quoted from the home page: "The License for the code is MIT, new-BSD,
|
|
|
|
|
;; LGPL, etc. ... if you need another license to help compatibility, just
|
|
|
|
|
;; ask for it. It's basically public domain, without all the legal
|
|
|
|
|
;; problems for everyone that trying to make something public domain
|
|
|
|
|
;; entails."
|
|
|
|
|
(license license:public-domain)))
|
|
|
|
|
|
2015-12-10 10:15:04 -05:00
|
|
|
|
(define-public libconfig
|
|
|
|
|
(package
|
|
|
|
|
(name "libconfig")
|
|
|
|
|
(version "1.5")
|
|
|
|
|
(source (origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append "http://www.hyperrealm.com/libconfig/"
|
|
|
|
|
"libconfig-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
|
|
|
|
"1xh3hzk63v4y8815lc5209m3s6ms2cpgw4h5hg462i4f1lwsl7g3"))))
|
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(home-page "http://www.hyperrealm.com/libconfig/")
|
|
|
|
|
(synopsis "C/C++ configuration file library")
|
|
|
|
|
(description
|
|
|
|
|
"Libconfig is a simple library for manipulating structured configuration
|
|
|
|
|
files. This file format is more compact and more readable than XML. And
|
|
|
|
|
unlike XML, it is type-aware, so it is not necessary to do string parsing in
|
|
|
|
|
application code.")
|
|
|
|
|
(license license:lgpl2.1+)))
|
2016-01-03 00:41:49 -05:00
|
|
|
|
|
|
|
|
|
(define-public pfff
|
|
|
|
|
(package
|
|
|
|
|
(name "pfff")
|
|
|
|
|
(version "1.0")
|
|
|
|
|
(source (origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append "https://github.com/pfff/pfff/archive/v"
|
|
|
|
|
version ".tar.gz"))
|
|
|
|
|
(file-name (string-append name "-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
|
|
|
|
"00m553aa277iarxj6dalmklyb64r7ias49bfwzbacsfg8h3kar8m"))))
|
|
|
|
|
(build-system cmake-build-system)
|
|
|
|
|
(home-page "http://biit.cs.ut.ee/pfff/")
|
|
|
|
|
(synopsis "Probabilistic fast file fingerprinting tool")
|
|
|
|
|
(description
|
|
|
|
|
"pfff is a tool for calculating a compact digital fingerprint of a file
|
|
|
|
|
by sampling randomly from the file instead of reading it in full.
|
|
|
|
|
Consequently, the computation has a flat performance characteristic,
|
|
|
|
|
correlated with data variation rather than file size. pfff can be as reliable
|
|
|
|
|
as existing hashing techniques, with provably negligible risk of collisions.")
|
|
|
|
|
(license license:bsd-3)))
|
2016-03-26 13:28:31 -04:00
|
|
|
|
|
|
|
|
|
(define-public oniguruma
|
|
|
|
|
(package
|
|
|
|
|
(name "oniguruma")
|
|
|
|
|
(version "5.9.6")
|
|
|
|
|
(source (origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append "https://github.com/kkos/"
|
|
|
|
|
"oniguruma/releases/download/v" version
|
|
|
|
|
"/onig-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
|
|
|
|
"19s79vsclqn170mw0ajwv7j37qsbn4f1yjz3yavnhvva6c820r6m"))))
|
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(home-page "https://github.com/kkos/oniguruma")
|
|
|
|
|
(synopsis "Regular expression library")
|
|
|
|
|
(description "Oniguruma is a regular expressions library. The special
|
|
|
|
|
characteristic of this library is that different character encoding for every
|
|
|
|
|
regular expression object can be specified.")
|
|
|
|
|
(license license:bsd-2)))
|
2016-04-28 02:11:05 -04:00
|
|
|
|
|
|
|
|
|
(define-public antiword
|
|
|
|
|
(package
|
|
|
|
|
(name "antiword")
|
|
|
|
|
(version "0.37")
|
|
|
|
|
(source (origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append "http://www.winfield.demon.nl/linux"
|
|
|
|
|
"/antiword-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
2016-05-30 02:35:10 -04:00
|
|
|
|
"1b7mi1l20jhj09kyh0bq14qzz8vdhhyf35gzwsq43mn6rc7h0b4f"))
|
|
|
|
|
(patches (search-patches "antiword-CVE-2014-8123.patch"))))
|
2016-04-28 02:11:05 -04:00
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(arguments
|
|
|
|
|
`(#:tests? #f ; There are no tests
|
|
|
|
|
#:make-flags
|
|
|
|
|
(list "-f" "Makefile.Linux"
|
|
|
|
|
(string-append "GLOBAL_INSTALL_DIR="
|
|
|
|
|
(assoc-ref %outputs "out") "/bin")
|
|
|
|
|
(string-append "GLOBAL_RESOURCES_DIR="
|
|
|
|
|
(assoc-ref %outputs "out") "/share/antiword"))
|
|
|
|
|
#:phases
|
|
|
|
|
(modify-phases %standard-phases
|
|
|
|
|
(delete 'configure)
|
|
|
|
|
(replace 'install
|
|
|
|
|
(lambda* (#:key make-flags #:allow-other-keys)
|
|
|
|
|
(zero? (apply system* "make" `("global_install" ,@make-flags))))))))
|
|
|
|
|
(home-page "http://www.winfield.demon.nl/")
|
|
|
|
|
(synopsis "Microsoft Word document reader")
|
|
|
|
|
(description "Antiword is an application for displaying Microsoft Word
|
|
|
|
|
documents. It can also convert the document to PostScript or XML. Only
|
|
|
|
|
documents made by MS Word version 2 and version 6 or later are supported. The
|
|
|
|
|
name comes from: \"The antidote against people who send Microsoft Word files
|
|
|
|
|
to everybody, because they believe that everybody runs Windows and therefore
|
|
|
|
|
runs Word\".")
|
|
|
|
|
(license license:gpl2+)))
|
2016-05-07 13:16:39 -04:00
|
|
|
|
|
2017-05-15 05:41:54 -04:00
|
|
|
|
(define-public catdoc
|
|
|
|
|
(package
|
|
|
|
|
(name "catdoc")
|
|
|
|
|
(version "0.95")
|
|
|
|
|
(source (origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append "http://ftp.wagner.pp.ru/pub/catdoc/"
|
|
|
|
|
"catdoc-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
|
|
|
|
"15h7v3bmwfk4z8r78xs5ih6vd0pskn0rj90xghvbzdjj0cc88jji"))))
|
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
;; TODO: Also build `wordview` which requires `tk` – make a separate
|
|
|
|
|
;; package for this.
|
|
|
|
|
(arguments
|
|
|
|
|
'(#:tests? #f ; There are no tests
|
|
|
|
|
#:configure-flags '("--disable-wordview")
|
|
|
|
|
#:phases
|
|
|
|
|
(modify-phases %standard-phases
|
|
|
|
|
(add-before 'install 'fix-install
|
|
|
|
|
(lambda* (#:key outputs #:allow-other-keys)
|
|
|
|
|
(let ((out (assoc-ref outputs "out")))
|
|
|
|
|
(mkdir-p (string-append out "/share/man/man1"))))))))
|
|
|
|
|
(home-page "http://www.wagner.pp.ru/~vitus/software/catdoc/")
|
|
|
|
|
(synopsis "MS-Word to TeX or plain text converter")
|
|
|
|
|
(description "@command{catdoc} extracts text from MS-Word files, trying to
|
|
|
|
|
preserve as many special printable characters as possible. It supports
|
|
|
|
|
everything up to Word-97. Also supported are MS Write documents and RTF files.
|
|
|
|
|
|
|
|
|
|
@command{catdoc} does not preserve complex word formatting, but it can
|
|
|
|
|
translate some non-ASCII characters into TeX escape codes. It's goal is to
|
|
|
|
|
extract plain text and allow you to read it and, probably, reformat with TeX,
|
|
|
|
|
according to TeXnical rules.
|
|
|
|
|
|
|
|
|
|
This package also provides @command{xls2csv}, which extracts data from Excel
|
|
|
|
|
spreadsheets and outputs it in comma-separated-value format, and
|
|
|
|
|
@command{catppt}, which extracts data from PowerPoint presentations.")
|
|
|
|
|
(license license:gpl2+)))
|
|
|
|
|
|
2016-05-07 13:16:39 -04:00
|
|
|
|
(define-public utfcpp
|
|
|
|
|
(package
|
|
|
|
|
(name "utfcpp")
|
|
|
|
|
(version "2.3.4")
|
|
|
|
|
(source (origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri
|
|
|
|
|
(string-append
|
2016-07-22 11:45:03 -04:00
|
|
|
|
"mirror://sourceforge/utfcpp/utf8cpp_2x/Release%20"
|
2016-05-07 13:16:39 -04:00
|
|
|
|
version "/utf8_v"
|
|
|
|
|
(string-map (lambda (x) (if (eq? x #\.) #\_ x)) version)
|
|
|
|
|
".zip"))
|
|
|
|
|
(file-name (string-append name "-" version ".zip"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
|
|
|
|
"1vqhs0aipcvvdrwcs7h3jsryg6mgbmc4s34n5cm6d36q4nxwwwrk"))))
|
|
|
|
|
(build-system trivial-build-system)
|
|
|
|
|
(arguments
|
|
|
|
|
`(#:modules ((guix build utils))
|
|
|
|
|
#:builder
|
|
|
|
|
(begin
|
|
|
|
|
(use-modules (guix build utils))
|
|
|
|
|
(let ((source (assoc-ref %build-inputs "source"))
|
|
|
|
|
(out (assoc-ref %outputs "out"))
|
|
|
|
|
(unzip (string-append (assoc-ref %build-inputs "unzip")
|
|
|
|
|
"/bin/unzip")))
|
|
|
|
|
(mkdir-p out)
|
|
|
|
|
(with-directory-excursion out
|
|
|
|
|
(system* unzip source)
|
|
|
|
|
(mkdir-p "share/doc")
|
|
|
|
|
(rename-file "doc" "share/doc/utfcpp")
|
|
|
|
|
(rename-file "source" "include"))))))
|
|
|
|
|
(native-inputs `(("unzip" ,unzip)))
|
|
|
|
|
(home-page "https://github.com/nemtrif/utfcpp")
|
|
|
|
|
(synopsis "Portable C++ library for handling UTF-8")
|
|
|
|
|
(description "UTF8-CPP is a C++ library for handling UTF-8 encoded text
|
|
|
|
|
in a portable way.")
|
|
|
|
|
(license license:boost1.0)))
|
2016-10-16 19:00:28 -04:00
|
|
|
|
|
|
|
|
|
(define-public dbacl
|
|
|
|
|
(package
|
|
|
|
|
(name "dbacl")
|
|
|
|
|
(version "1.14")
|
|
|
|
|
(source
|
|
|
|
|
(origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append "http://www.lbreyer.com/gpl/"
|
|
|
|
|
name "-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
|
|
|
|
"0224g6x71hyvy7jikfxmgcwww1r5lvk0jx36cva319cb9nmrbrq7"))))
|
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(arguments
|
|
|
|
|
`(#:make-flags
|
|
|
|
|
(list
|
|
|
|
|
(string-append "-I" (assoc-ref %build-inputs "slang")
|
|
|
|
|
"/include/slang")
|
|
|
|
|
(string-append "-I" (assoc-ref %build-inputs "ncurses")
|
|
|
|
|
"/include/ncurses"))
|
|
|
|
|
#:phases
|
|
|
|
|
(modify-phases %standard-phases
|
|
|
|
|
(add-after 'unpack 'delete-sample6-and-japanese
|
|
|
|
|
(lambda _
|
|
|
|
|
(substitute* "doc/Makefile.am"
|
|
|
|
|
(("sample6.txt") "")
|
|
|
|
|
(("japanese.txt") ""))
|
|
|
|
|
(delete-file "doc/sample6.txt")
|
|
|
|
|
(delete-file "doc/japanese.txt")
|
|
|
|
|
(substitute* (list "src/tests/Makefile.am"
|
|
|
|
|
"src/tests/Makefile.in")
|
|
|
|
|
(("dbacl-jap.shin") "")
|
|
|
|
|
(("dbacl-jap.sh") ""))
|
|
|
|
|
#t))
|
|
|
|
|
(add-after 'unpack 'delete-test
|
|
|
|
|
;; See comments about the license.
|
|
|
|
|
(lambda _
|
|
|
|
|
(delete-file "src/tests/dbacl-jap.shin")))
|
|
|
|
|
(add-after 'delete-sample6-and-japanese 'autoreconf
|
|
|
|
|
(lambda _
|
|
|
|
|
(zero? (system* "autoreconf" "-vif"))))
|
|
|
|
|
(add-after 'unpack 'fix-test-files
|
|
|
|
|
(lambda* (#:key inputs outputs #:allow-other-keys)
|
|
|
|
|
(let* ((out (assoc-ref outputs "out"))
|
|
|
|
|
(bin (string-append out "/bin")))
|
|
|
|
|
(substitute* (find-files "src/tests/" "\\.shin$")
|
|
|
|
|
(("PATH=/bin:/usr/bin")
|
|
|
|
|
"#PATH=/bin:/usr/bin")
|
|
|
|
|
(("diff") (string-append (which "diff")))
|
|
|
|
|
(("tr") (string-append (which "tr"))))
|
|
|
|
|
#t))))))
|
|
|
|
|
(inputs
|
|
|
|
|
`(("ncurses" ,ncurses)
|
|
|
|
|
("perl" ,perl)
|
|
|
|
|
("readline" ,readline)
|
|
|
|
|
("slang" ,slang)))
|
|
|
|
|
(native-inputs
|
|
|
|
|
`(("libtool" ,libtool)
|
|
|
|
|
("autoconf" ,autoconf)
|
|
|
|
|
("automake" ,automake)
|
|
|
|
|
("pkg-config" ,pkg-config)))
|
|
|
|
|
(home-page "http://www.lbreyer.com/dbacl.html")
|
|
|
|
|
(synopsis "Bayesian text and email classifier")
|
|
|
|
|
(description
|
|
|
|
|
"dbacl is a fast Bayesian text and email classifier. It builds a variety
|
|
|
|
|
of language models using maximum entropy (minimum divergence) principles, and
|
|
|
|
|
these can then be used to categorize input data automatically among multiple
|
|
|
|
|
categories.")
|
|
|
|
|
;; The software is licensed as GPLv3 or later, but
|
|
|
|
|
;; includes various sample texts in the doc dir:
|
|
|
|
|
;; - sample1.txt, sample3 and sampe5.txt are in the public domain,
|
|
|
|
|
;; by Mark Twain.
|
|
|
|
|
;; - sample2.txt, sample4.txt are in the public domain, by Aristotle.
|
|
|
|
|
;; - sample6.txt is a forwarded email, copyright unknown.
|
|
|
|
|
;; Guix does exclude sample6.txt.
|
|
|
|
|
;; - japanese.txt is a Japanese unoffical translation of the
|
|
|
|
|
;; GNU General Public License, (c) by the Free Software Foundation.
|
|
|
|
|
;; Guix excludes this file.
|
|
|
|
|
(license (list license:gpl3+ license:public-domain))))
|
2016-10-12 18:24:42 -04:00
|
|
|
|
|
|
|
|
|
(define-public dotconf
|
|
|
|
|
(package
|
|
|
|
|
(name "dotconf")
|
|
|
|
|
(version "1.3")
|
|
|
|
|
(source (origin
|
|
|
|
|
(method url-fetch)
|
|
|
|
|
(uri (string-append
|
|
|
|
|
"https://github.com/williamh/dotconf/archive/v"
|
|
|
|
|
version ".tar.gz"))
|
|
|
|
|
(file-name (string-append name "-" version ".tar.gz"))
|
|
|
|
|
(sha256
|
|
|
|
|
(base32
|
|
|
|
|
"0lsnh0yaw44psmx59hq94cj1932gscp5h8d3cnh05l0svr0cy7kz"))))
|
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
|
(arguments
|
|
|
|
|
`(#:tests? #f ; FIXME maketest.sh does not work.
|
|
|
|
|
#:phases
|
|
|
|
|
(modify-phases %standard-phases
|
|
|
|
|
(add-before 'configure 'autoreconf
|
|
|
|
|
(lambda _
|
|
|
|
|
(zero? (system* "autoreconf" "-vif")))))))
|
|
|
|
|
(native-inputs
|
|
|
|
|
`(("autoconf" ,autoconf)
|
|
|
|
|
("automake" ,automake)
|
|
|
|
|
("libtool" ,libtool)))
|
|
|
|
|
(home-page "https://github.com/williamh/dotconf")
|
|
|
|
|
(synopsis "Configuration file parser library")
|
|
|
|
|
(description
|
|
|
|
|
"C library for creating and parsing configuration files.")
|
|
|
|
|
(license (list license:lgpl2.1 ; Main distribution.
|
|
|
|
|
license:asl1.1)))) ; src/readdir.{c,h}
|