mirror of
https://git.in.rschanz.org/ryan77627/guix.git
synced 2024-12-30 16:12:58 -05:00
35e4e3597f
* gnu/packages/language.scm (perl-lingua-en-tagger): Update to 0.30.
408 lines
16 KiB
Scheme
408 lines
16 KiB
Scheme
;;; GNU Guix --- Functional package management for GNU
|
|
;;; Copyright © 2015, 2016 Eric Bavier <bavier@member.fsf.org>
|
|
;;; Copyright © 2017, 2018 Tobias Geerinckx-Rice <me@tobias.gr>
|
|
;;; Copyright © 2018 ng0 <ng0@n0.is>
|
|
;;;
|
|
;;; This file is part of GNU Guix.
|
|
;;;
|
|
;;; GNU Guix is free software; you can redistribute it and/or modify it
|
|
;;; under the terms of the GNU General Public License as published by
|
|
;;; the Free Software Foundation; either version 3 of the License, or (at
|
|
;;; your option) any later version.
|
|
;;;
|
|
;;; GNU Guix is distributed in the hope that it will be useful, but
|
|
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
;;; GNU General Public License for more details.
|
|
;;;
|
|
;;; You should have received a copy of the GNU General Public License
|
|
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
(define-module (gnu packages language)
|
|
#:use-module (gnu packages)
|
|
#:use-module (gnu packages perl)
|
|
#:use-module (gnu packages perl-check)
|
|
#:use-module (gnu packages web)
|
|
#:use-module (guix packages)
|
|
#:use-module (guix build-system perl)
|
|
#:use-module ((guix licenses) #:select (gpl2 gpl3 perl-license))
|
|
#:use-module (guix download))
|
|
|
|
(define-public perl-lingua-en-findnumber
|
|
(package
|
|
(name "perl-lingua-en-findnumber")
|
|
(version "1.32")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/N/NE/NEILB/"
|
|
"Lingua-EN-FindNumber-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"015ximzdp42v824llwlg2pd77vd0d172lb4xs55q9f9zhqf6s5qx"))))
|
|
(build-system perl-build-system)
|
|
(propagated-inputs
|
|
`(("perl-lingua-en-words2nums" ,perl-lingua-en-words2nums)))
|
|
(home-page "https://metacpan.org/release/Lingua-EN-FindNumber")
|
|
(synopsis "Locate (written) numbers in English text ")
|
|
(description "This module provides a regular expression for finding
|
|
numbers in English text. It also provides functions for extracting and
|
|
manipulating such numbers.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-en-inflect
|
|
(package
|
|
(name "perl-lingua-en-inflect")
|
|
(version "1.903")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/D/DC/DCONWAY/"
|
|
"Lingua-EN-Inflect-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"0j8d1f1wvmgc11d71pc8xp8fv5a1nb2yfw1dgd19xhscn1klpvzw"))))
|
|
(build-system perl-build-system)
|
|
(native-inputs `(("perl-module-build" ,perl-module-build)))
|
|
(home-page "https://metacpan.org/release/Lingua-EN-Inflect")
|
|
(synopsis "Convert singular to plural")
|
|
(description "Lingua::EN::Inflect provides plural inflections,
|
|
\"a\"/\"an\" selection for English words, and manipulation of numbers as
|
|
words. Plural forms of all nouns, most verbs, and some adjectives are
|
|
provided. Where appropriate, \"classical\" variants (for example: \"brother\"
|
|
-> \"brethren\", \"dogma\" -> \"dogmata\", etc.) are also provided.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-en-inflect-number
|
|
(package
|
|
(name "perl-lingua-en-inflect-number")
|
|
(version "1.12")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/N/NE/NEILB/"
|
|
"Lingua-EN-Inflect-Number-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"1gxccynkaqav43ww43jp4rzkyr36x97jd03yb5f6yx0jhn1k7yv6"))))
|
|
(build-system perl-build-system)
|
|
(propagated-inputs
|
|
`(("perl-lingua-en-inflect" ,perl-lingua-en-inflect)))
|
|
(home-page "https://metacpan.org/release/Lingua-EN-Inflect-Number")
|
|
(synopsis "Force number of words to singular or plural")
|
|
(description "This module extends the functionality of Lingua::EN::Inflect
|
|
with three new functions for determining plurality of a word and forcefully
|
|
converting a word to singular or plural.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-en-inflect-phrase
|
|
(package
|
|
(name "perl-lingua-en-inflect-phrase")
|
|
(version "0.20")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/R/RK/RKITOVER/"
|
|
"Lingua-EN-Inflect-Phrase-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"1a6y1l2pjim2242wcpgz066di4pbzfgsjjdl7vg5a5wzm48qj1am"))))
|
|
(build-system perl-build-system)
|
|
(native-inputs
|
|
`(("perl-test-nowarnings" ,perl-test-nowarnings)))
|
|
(propagated-inputs
|
|
`(("perl-lingua-en-findnumber" ,perl-lingua-en-findnumber)
|
|
("perl-lingua-en-inflect" ,perl-lingua-en-inflect)
|
|
("perl-lingua-en-inflect-number" ,perl-lingua-en-inflect-number)
|
|
("perl-lingua-en-number-isordinal" ,perl-lingua-en-number-isordinal)
|
|
("perl-lingua-en-tagger" ,perl-lingua-en-tagger)))
|
|
(home-page "https://metacpan.org/release/Lingua-EN-Inflect-Phrase")
|
|
(synopsis "Inflect short English phrases")
|
|
(description "This module attempts to pluralize or singularize short
|
|
English phrases.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-en-number-isordinal
|
|
(package
|
|
(name "perl-lingua-en-number-isordinal")
|
|
(version "0.05")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/R/RK/RKITOVER/"
|
|
"Lingua-EN-Number-IsOrdinal-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"1mhqjvh2ad30gjab5b3a6mbr4aysyrscp4wp42yy5x6001a6km98"))))
|
|
(build-system perl-build-system)
|
|
(native-inputs
|
|
`(("perl-try-tiny" ,perl-try-tiny)
|
|
("perl-test-fatal" ,perl-test-fatal)))
|
|
(propagated-inputs
|
|
`(("perl-lingua-en-findnumber" ,perl-lingua-en-findnumber)))
|
|
(home-page "https://metacpan.org/release/Lingua-EN-Number-IsOrdinal")
|
|
(synopsis "Detect if English number is ordinal or cardinal")
|
|
(description "This module will tell you if a number, either in words or as
|
|
digits, is a cardinal or ordinal number.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-en-tagger
|
|
(package
|
|
(name "perl-lingua-en-tagger")
|
|
(version "0.30")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/A/AC/ACOBURN/"
|
|
"Lingua-EN-Tagger-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"0nrnkvsf9f0a7lp82sanmy89ms2nqq1lvjqicvsagsvzp513bl5b"))))
|
|
(build-system perl-build-system)
|
|
(propagated-inputs
|
|
`(("perl-memoize-expirelru" ,perl-memoize-expirelru)
|
|
("perl-lingua-stem" ,perl-lingua-stem)
|
|
("perl-html-parser" ,perl-html-parser)
|
|
("perl-html-tagset" ,perl-html-tagset)))
|
|
(home-page "https://metacpan.org/release/Lingua-EN-Tagger")
|
|
(synopsis "Part-of-speech tagger for English natural language processing")
|
|
(description "This module is a probability based, corpus-trained tagger
|
|
that assigns part-of-speech tags to English text based on a lookup dictionary
|
|
and a set of probability values. The tagger assigns appropriate tags based on
|
|
conditional probabilities - it examines the preceding tag to determine the
|
|
appropriate tag for the current word. Unknown words are classified according
|
|
to word morphology or can be set to be treated as nouns or other parts of
|
|
speech. The tagger also extracts as many nouns and noun phrases as it can,
|
|
using a set of regular expressions.")
|
|
(license gpl3)))
|
|
|
|
(define-public perl-lingua-en-words2nums
|
|
(package
|
|
(name "perl-lingua-en-words2nums")
|
|
(version "0.18")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/J/JO/JOEY/"
|
|
"Lingua-EN-Words2Nums-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"118xx8qr1zbx30psv7ic55w65h15mc1vz6zicshfm96jgiwmcrb8"))))
|
|
(build-system perl-build-system)
|
|
(home-page "https://metacpan.org/release/Lingua-EN-Words2Nums")
|
|
(synopsis "Convert English text to numbers")
|
|
(description "This module converts English text into numbers. It supports
|
|
both ordinal and cardinal numbers, negative numbers, and very large numbers.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-pt-stemmer
|
|
(package
|
|
(name "perl-lingua-pt-stemmer")
|
|
(version "0.02")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/N/NE/NEILB/"
|
|
"Lingua-PT-Stemmer-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"17c48sfbgwd2ivlgf59sr6jdhwa3aim8750f8pyzz7xpi8gz0var"))))
|
|
(build-system perl-build-system)
|
|
(home-page "https://metacpan.org/release/Lingua-PT-Stemmer")
|
|
(synopsis "Portuguese language stemming")
|
|
(description "This module implements a Portuguese stemming algorithm
|
|
proposed in the paper A Stemming Algorithm for the Portuguese Language by
|
|
Moreira, V. and Huyck, C.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-stem
|
|
(package
|
|
(name "perl-lingua-stem")
|
|
(version "0.84")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/S/SN/SNOWHARE/"
|
|
"Lingua-Stem-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"12avh2mnnc7llmmshrr5bgb473fvydxnlqrqbl2815mf2dp4pxcg"))))
|
|
(build-system perl-build-system)
|
|
(native-inputs
|
|
`(("perl-module-build" ,perl-module-build)))
|
|
(propagated-inputs
|
|
`(("perl-lingua-pt-stemmer" ,perl-lingua-pt-stemmer)
|
|
("perl-lingua-stem-fr" ,perl-lingua-stem-fr)
|
|
("perl-lingua-stem-it" ,perl-lingua-stem-it)
|
|
("perl-lingua-stem-ru" ,perl-lingua-stem-ru)
|
|
("perl-lingua-stem-snowball-da" ,perl-lingua-stem-snowball-da)
|
|
("perl-snowball-norwegian" ,perl-snowball-norwegian)
|
|
("perl-snowball-swedish" ,perl-snowball-swedish)
|
|
("perl-text-german" ,perl-text-german)))
|
|
(home-page "https://metacpan.org/release/Lingua-Stem")
|
|
(synopsis "Stemming of words in various languages")
|
|
(description "This routine applies stemming algorithms to its parameters,
|
|
returning the stemmed words as appropriate to the selected locale.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-stem-fr
|
|
(package
|
|
(name "perl-lingua-stem-fr")
|
|
(version "0.02")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/S/SD/SDP/"
|
|
"Lingua-Stem-Fr-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"0vyrspwzaqjxm5mqshf4wvwa3938mkajd1918d9ii2l9m2rn8kwx"))))
|
|
(build-system perl-build-system)
|
|
(home-page "https://metacpan.org/release/Lingua-Stem-Fr")
|
|
(synopsis "Porter's stemming algorithm for French")
|
|
(description "This module uses a modified version of the Porter Stemming
|
|
Algorithm to return a stemmed French word.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-stem-it
|
|
(package
|
|
(name "perl-lingua-stem-it")
|
|
(version "0.02")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/A/AC/ACALPINI/"
|
|
"Lingua-Stem-It-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"1207r183s5hlh4mfwa6p46vzm0dhvrs2dnss5s41a0gyfkxp7riq"))))
|
|
(build-system perl-build-system)
|
|
(home-page "https://metacpan.org/release/Lingua-Stem-It")
|
|
(synopsis "Porter's stemming algorithm for Italian")
|
|
(description "This module applies the Porter Stemming Algorithm to its
|
|
parameters, returning the stemmed Italian word.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-stem-ru
|
|
(package
|
|
(name "perl-lingua-stem-ru")
|
|
(version "0.04")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/N/NE/NEILB/"
|
|
"Lingua-Stem-Ru-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"0a2jmdz7jn32qj5hyiw5kbv8fvlpmws8i00a6xcbkzb48yvwww0j"))))
|
|
(build-system perl-build-system)
|
|
(home-page "https://metacpan.org/release/Lingua-Stem-Ru")
|
|
(synopsis "Porter's stemming algorithm for Russian")
|
|
(description "This module applies the Porter Stemming Algorithm to its
|
|
parameters, returning the stemmed Russian (KOI8-R only) word.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-lingua-stem-snowball-da
|
|
(package
|
|
(name "perl-lingua-stem-snowball-da")
|
|
(version "1.01")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/C/CI/CINE/"
|
|
"Lingua-Stem-Snowball-Da-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"0mm0m7glm1s6i9f6a78jslw6wh573208arxhq93yriqmw17bwf9f"))))
|
|
(build-system perl-build-system)
|
|
(home-page "https://metacpan.org/release/Lingua-Stem-Snowball-Da")
|
|
(synopsis "Porters stemming algorithm for Danish")
|
|
(description "Lingua::Stem::Snowball::Da is a perl port of the danish
|
|
stemmer at http://snowball.sourceforge.net, it was originally altered from the
|
|
Lingua::Stem::Snowball::Se.")
|
|
(license gpl2)))
|
|
|
|
(define-public perl-snowball-norwegian
|
|
(package
|
|
(name "perl-snowball-norwegian")
|
|
(version "1.2")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/A/AS/ASKSH/"
|
|
"Snowball-Norwegian-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"0675v45bbsh7vr7kpf36xs2q79g02iq1kmfw22h20xdk4rzqvkqx"))))
|
|
(build-system perl-build-system)
|
|
(native-inputs `(("perl-module-build" ,perl-module-build)))
|
|
(home-page "https://metacpan.org/release/Snowball-Norwegian")
|
|
(synopsis "Porters stemming algorithm for Norwegian")
|
|
(description "Lingua::Stem::Snowball::No is a perl port of the norwegian
|
|
stemmer at http://snowball.tartarus.org.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-snowball-swedish
|
|
(package
|
|
(name "perl-snowball-swedish")
|
|
(version "1.2")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/A/AS/ASKSH/"
|
|
"Snowball-Swedish-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"0agwc12jk5kmabnpsplw3wf4ii5w1zb159cpin44x3srb0sr5apg"))))
|
|
(build-system perl-build-system)
|
|
(native-inputs `(("perl-module-build" ,perl-module-build)))
|
|
(home-page "https://metacpan.org/release/Snowball-Swedish")
|
|
(synopsis "Porters stemming algorithm for Swedish")
|
|
(description "Lingua::Stem::Snowball::Se is a perl port of the swedish
|
|
stemmer at http://snowball.sourceforge.net.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-string-toidentifier-en
|
|
(package
|
|
(name "perl-string-toidentifier-en")
|
|
(version "0.12")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/R/RK/RKITOVER/"
|
|
"String-ToIdentifier-EN-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"12nw7h2yiybhdw0vnnpc7bif8ylhsn6kqf6s39dsrf9h54iq9yrs"))))
|
|
(build-system perl-build-system)
|
|
(propagated-inputs
|
|
`(("perl-lingua-en-inflect-phrase" ,perl-lingua-en-inflect-phrase)
|
|
("perl-text-unidecode" ,perl-text-unidecode)
|
|
("perl-namespace-clean" ,perl-namespace-clean)))
|
|
(home-page "https://metacpan.org/release/String-ToIdentifier-EN")
|
|
(synopsis "Convert strings to English program identifiers")
|
|
(description "This module provides a utility method, \"to_identifier\" for
|
|
converting an arbitrary string into a readable representation using the ASCII
|
|
subset of \"\\w\" for use as an identifier in a computer program. The intent
|
|
is to make unique identifier names from which the content of the original
|
|
string can be easily inferred by a human just by reading the identifier.")
|
|
(license perl-license)))
|
|
|
|
(define-public perl-text-german
|
|
(package
|
|
(name "perl-text-german")
|
|
(version "0.06")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/U/UL/ULPFR/"
|
|
"Text-German-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"1p87pgap99lw0nv62i3ghvsi7yg90lhn8vsa3yqp75rd04clybcj"))))
|
|
(build-system perl-build-system)
|
|
(home-page "https://metacpan.org/release/Text-German")
|
|
(synopsis "German grundform reduction")
|
|
(description "This module is a rather incomplete implementation of work
|
|
done by Gudrun Putze-Meier.")
|
|
(license perl-license)))
|