From fc436dbaea68ef727ec7bdba80e4bae4fcfe27b5 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Mon, 16 Mar 2015 23:07:55 -0500 Subject: gnu: Add Lingua-EN-Words2Nums. * gnu/packages/language.scm: New file. * gnu-system.am (GNU_SYSTEM_MODULES): Add it. --- gnu/packages/language.scm | 43 +++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 43 insertions(+) create mode 100644 gnu/packages/language.scm (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm new file mode 100644 index 0000000000..fbf27f0e71 --- /dev/null +++ b/gnu/packages/language.scm @@ -0,0 +1,43 @@ +;;; GNU Guix --- Functional package management for GNU +;;; Copyright © 2015 Eric Bavier +;;; +;;; This file is part of GNU Guix. +;;; +;;; GNU Guix is free software; you can redistribute it and/or modify it +;;; under the terms of the GNU General Public License as published by +;;; the Free Software Foundation; either version 3 of the License, or (at +;;; your option) any later version. +;;; +;;; GNU Guix is distributed in the hope that it will be useful, but +;;; WITHOUT ANY WARRANTY; without even the implied warranty of +;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +;;; GNU General Public License for more details. +;;; +;;; You should have received a copy of the GNU General Public License +;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
+ +(define-module (gnu packages language) + #:use-module (gnu packages) + #:use-module (gnu packages perl) + #:use-module (guix packages) + #:use-module (guix build-system perl) + #:use-module (guix download)) + +(define-public perl-lingua-en-words2nums + (package + (name "perl-lingua-en-words2nums") + (version "0.18") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/J/JO/JOEY/" + "Lingua-EN-Words2Nums-" version ".tar.gz")) + (sha256 + (base32 + "118xx8qr1zbx30psv7ic55w65h15mc1vz6zicshfm96jgiwmcrb8")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Lingua-EN-Words2Nums") + (synopsis "Convert English text to numbers") + (description "This module converts English text into numbers. It supports +both ordinal and cardinal numbers, negative numbers, and very large numbers.") + (license (package-license perl)))) -- cgit 1.4.1 From 0c32bf01172118967d8a7a349313c4b4b06c0012 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Mon, 16 Mar 2015 23:09:22 -0500 Subject: gnu: Add Lingua-EN-FindNumber. * gnu/packages/language.scm (perl-lingua-en-findnumber): New variable. 
--- gnu/packages/language.scm | 22 ++++++++++++++++++++++ 1 file changed, 22 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index fbf27f0e71..24e7fa447c 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -23,6 +23,28 @@ #:use-module (guix build-system perl) #:use-module (guix download)) +(define-public perl-lingua-en-findnumber + (package + (name "perl-lingua-en-findnumber") + (version "1.30") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/N/NE/NEILB/" + "Lingua-EN-FindNumber-" version ".tar.gz")) + (sha256 + (base32 + "0g5h6bwwggizwh3dd3xyx92537s4qy8nspshp1lrm9qlxh3prc28")))) + (build-system perl-build-system) + (propagated-inputs + `(("perl-lingua-en-words2nums" ,perl-lingua-en-words2nums))) + (home-page "http://search.cpan.org/dist/Lingua-EN-FindNumber") + (synopsis "Locate (written) numbers in English text ") + (description "This module provides a regular expression for finding +numbers in English text. It also provides functions for extracting and +manipulating such numbers.") + (license (package-license perl)))) + (define-public perl-lingua-en-words2nums (package (name "perl-lingua-en-words2nums") -- cgit 1.4.1 From 57ff0e04f18a253604a65d1e20128de2dff1dddd Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Mon, 16 Mar 2015 23:13:17 -0500 Subject: gnu: Add Lingua-EN-Inflect. * gnu/packages/language.scm (perl-lingua-en-inflect): New variable. --- gnu/packages/language.scm | 22 ++++++++++++++++++++++ 1 file changed, 22 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index 24e7fa447c..c02771d12a 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -45,6 +45,28 @@ numbers in English text. 
It also provides functions for extracting and manipulating such numbers.") (license (package-license perl)))) +(define-public perl-lingua-en-inflect + (package + (name "perl-lingua-en-inflect") + (version "1.895") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/D/DC/DCONWAY/" + "Lingua-EN-Inflect-" version ".tar.gz")) + (sha256 + (base32 + "0drzg9a2dkjxgf00n6jg0jzhd8972bh3j4wdnmdxpqi3zmfqhwcy")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Lingua-EN-Inflect") + (synopsis "Convert singular to plural") + (description "Lingua::EN::Inflect provides plural inflections, +\"a\"/\"an\" selection for English words, and manipulation of numbers as +words. Plural forms of all nouns, most verbs, and some adjectives are +provided. Where appropriate, \"classical\" variants (for example: \"brother\" +-> \"brethren\", \"dogma\" -> \"dogmata\", etc.) are also provided.") + (license (package-license perl)))) + (define-public perl-lingua-en-words2nums (package (name "perl-lingua-en-words2nums") -- cgit 1.4.1 From 4812a813a272261385d34d432cd1f2c46d403704 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Mon, 16 Mar 2015 23:18:23 -0500 Subject: gnu: Add Lingua-EN-Inflect-Number. * gnu/packages/language.scm (perl-lingua-en-inflect-number): New variable. --- gnu/packages/language.scm | 22 ++++++++++++++++++++++ 1 file changed, 22 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index c02771d12a..2fdffa0b72 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -67,6 +67,28 @@ provided. Where appropriate, \"classical\" variants (for example: \"brother\" -> \"brethren\", \"dogma\" -> \"dogmata\", etc.) 
are also provided.") (license (package-license perl)))) +(define-public perl-lingua-en-inflect-number + (package + (name "perl-lingua-en-inflect-number") + (version "1.11") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/N/NE/NEILB/" + "Lingua-EN-Inflect-Number-" version ".tar.gz")) + (sha256 + (base32 + "0rvgrff96ja7fqr79dszmiyv2wz4izw82znah0mx9szkir657gfz")))) + (build-system perl-build-system) + (propagated-inputs + `(("perl-lingua-en-inflect" ,perl-lingua-en-inflect))) + (home-page "http://search.cpan.org/dist/Lingua-EN-Inflect-Number") + (synopsis "Force number of words to singular or plural") + (description "This module extends the functionality of Lingua::EN::Inflect +with three new functions for determining plurality of a word and forcefully +converting a word to singular or plural.") + (license (package-license perl)))) + (define-public perl-lingua-en-words2nums (package (name "perl-lingua-en-words2nums") -- cgit 1.4.1 From 930768b3e45ac66b2e868fe413ca2e35634c26ee Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Mon, 16 Mar 2015 23:21:22 -0500 Subject: gnu: Add Lingua-EN-Number-IsOrdinal. * gnu/packages/language.scm (perl-lingua-en-number-isordinal): New variable. 
--- gnu/packages/language.scm | 24 ++++++++++++++++++++++++ 1 file changed, 24 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index 2fdffa0b72..f08c5e8f62 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -89,6 +89,30 @@ with three new functions for determining plurality of a word and forcefully converting a word to singular or plural.") (license (package-license perl)))) +(define-public perl-lingua-en-number-isordinal + (package + (name "perl-lingua-en-number-isordinal") + (version "0.04") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/R/RK/RKITOVER/" + "Lingua-EN-Number-IsOrdinal-" version ".tar.gz")) + (sha256 + (base32 + "1321fm4pyqcamffd0qsjm1gb07ijqndlb29qkcqf22kaibngfm4i")))) + (build-system perl-build-system) + (native-inputs + `(("perl-try-tiny" ,perl-try-tiny) + ("perl-test-fatal" ,perl-test-fatal))) + (propagated-inputs + `(("perl-lingua-en-findnumber" ,perl-lingua-en-findnumber))) + (home-page "http://search.cpan.org/dist/Lingua-EN-Number-IsOrdinal") + (synopsis "Detect if English number is ordinal or cardinal") + (description "This module will tell you if a number, either in words or as +digits, is a cardinal or ordinal number.") + (license (package-license perl)))) + (define-public perl-lingua-en-words2nums (package (name "perl-lingua-en-words2nums") -- cgit 1.4.1 From 9b446711e75aaf8e58a5f7f7536006590e91ace5 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Mon, 16 Mar 2015 23:33:44 -0500 Subject: gnu: Add Lingua-PT-Stemmer. * gnu/packages/language.scm (perl-lingua-pt-stemmer): New variable. 
--- gnu/packages/language.scm | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index f08c5e8f62..be85b798b2 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -131,3 +131,23 @@ digits, is a cardinal or ordinal number.") (description "This module converts English text into numbers. It supports both ordinal and cardinal numbers, negative numbers, and very large numbers.") (license (package-license perl)))) + +(define-public perl-lingua-pt-stemmer + (package + (name "perl-lingua-pt-stemmer") + (version "0.01") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/X/XE/XERN/" + "Lingua-PT-Stemmer-" version ".tar.gz")) + (sha256 + (base32 + "11rqc5pqnkl9c13vy7sihiyas14ci0pj3k6chrgrgjv5sjv2m4a5")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Lingua-PT-Stemmer") + (synopsis "Portuguese language stemming") + (description "This module implements a Portuguese stemming algorithm +proposed in the paper A Stemming Algorithm for the Portuguese Language by +Moreira, V. and Huyck, C.") + (license (package-license perl)))) -- cgit 1.4.1 From df11e05241497e1e9e97178aaa93b9833acb2d65 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Mon, 16 Mar 2015 23:37:59 -0500 Subject: gnu: Add Lingua-Stem-Fr. * gnu/packages/language.scm (perl-lingua-stem-fr): New variable. --- gnu/packages/language.scm | 19 +++++++++++++++++++ 1 file changed, 19 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index be85b798b2..2886fed966 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -151,3 +151,22 @@ both ordinal and cardinal numbers, negative numbers, and very large numbers.") proposed in the paper A Stemming Algorithm for the Portuguese Language by Moreira, V. 
and Huyck, C.") (license (package-license perl)))) + +(define-public perl-lingua-stem-fr + (package + (name "perl-lingua-stem-fr") + (version "0.02") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/S/SD/SDP/" + "Lingua-Stem-Fr-" version ".tar.gz")) + (sha256 + (base32 + "0vyrspwzaqjxm5mqshf4wvwa3938mkajd1918d9ii2l9m2rn8kwx")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Lingua-Stem-Fr") + (synopsis "Porter's stemming algorithm for French") + (description "This module uses a modified version of the Porter Stemming +Algorithm to return a stemmed French word.") + (license (package-license perl)))) -- cgit 1.4.1 From 6afe59593b29c21fbd1e80ed589edad2b05bf828 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 09:04:24 -0500 Subject: gnu: Add Lingua-Stem-It. * gnu/packages/language.scm (perl-lingua-stem-it): New variable. --- gnu/packages/language.scm | 19 +++++++++++++++++++ 1 file changed, 19 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index 2886fed966..ad222c785b 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -170,3 +170,22 @@ Moreira, V. 
and Huyck, C.") (description "This module uses a modified version of the Porter Stemming Algorithm to return a stemmed French word.") (license (package-license perl)))) + +(define-public perl-lingua-stem-it + (package + (name "perl-lingua-stem-it") + (version "0.02") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/A/AC/ACALPINI/" + "Lingua-Stem-It-" version ".tar.gz")) + (sha256 + (base32 + "1207r183s5hlh4mfwa6p46vzm0dhvrs2dnss5s41a0gyfkxp7riq")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Lingua-Stem-It") + (synopsis "Porter's stemming algorithm for Italian") + (description "This module applies the Porter Stemming Algorithm to its +parameters, returning the stemmed Italian word.") + (license (package-license perl)))) -- cgit 1.4.1 From 95d2eec1a8b6d8a5803a6911bec5d9f38951337b Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 09:59:28 -0500 Subject: gnu: Add Lingua-Stem-Ru. * gnu/packages/language.scm (perl-lingua-stem-ru): New variable. 
--- gnu/packages/language.scm | 19 +++++++++++++++++++ 1 file changed, 19 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index ad222c785b..ae972f961f 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -189,3 +189,22 @@ Algorithm to return a stemmed French word.") (description "This module applies the Porter Stemming Algorithm to its parameters, returning the stemmed Italian word.") (license (package-license perl)))) + +(define-public perl-lingua-stem-ru + (package + (name "perl-lingua-stem-ru") + (version "0.01") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/A/AL/ALGDR/" + "Lingua-Stem-Ru-" version ".tar.gz")) + (sha256 + (base32 + "0pqgg442fkf12ayh9fgmpa8q9x0iqx6s96181r52yn7s7pcs61h6")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Lingua-Stem-Ru") + (synopsis "Porter's stemming algorithm for Russian") + (description "This module applies the Porter Stemming Algorithm to its +parameters, returning the stemmed Russian (KOI8-R only) word.") + (license (package-license perl)))) -- cgit 1.4.1 From 30c400446c9f1e57582faf1d469afe0af2614511 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 10:11:27 -0500 Subject: gnu: Add Lingua-Stem-Snowball-Da. * gnu/packages/language.scm (perl-lingua-stem-snowball-da): New variable. 
--- gnu/packages/language.scm | 21 +++++++++++++++++++++ 1 file changed, 21 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index ae972f961f..69c41c0a31 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -21,6 +21,7 @@ #:use-module (gnu packages perl) #:use-module (guix packages) #:use-module (guix build-system perl) + #:use-module ((guix licenses) #:select (gpl2)) #:use-module (guix download)) (define-public perl-lingua-en-findnumber @@ -208,3 +209,23 @@ parameters, returning the stemmed Italian word.") (description "This module applies the Porter Stemming Algorithm to its parameters, returning the stemmed Russian (KOI8-R only) word.") (license (package-license perl)))) + +(define-public perl-lingua-stem-snowball-da + (package + (name "perl-lingua-stem-snowball-da") + (version "1.01") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/C/CI/CINE/" + "Lingua-Stem-Snowball-Da-" version ".tar.gz")) + (sha256 + (base32 + "0mm0m7glm1s6i9f6a78jslw6wh573208arxhq93yriqmw17bwf9f")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Lingua-Stem-Snowball-Da") + (synopsis "Porter's stemming algorithm for Danish") + (description "Lingua::Stem::Snowball::Da is a perl port of the danish +stemmer at http://snowball.sourceforge.net, it was originally altered from the +Lingua::Stem::Snowball::Se.") + (license gpl2))) -- cgit 1.4.1 From 1064abdc4204dde473dce7bd8f5b3ca8756e72f9 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 10:19:36 -0500 Subject: gnu: Add Snowball-Norwegian. * gnu/packages/language.scm (perl-snowball-norwegian): New variable. 
--- gnu/packages/language.scm | 19 +++++++++++++++++++ 1 file changed, 19 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index 69c41c0a31..efc96d8830 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -229,3 +229,22 @@ parameters, returning the stemmed Russian (KOI8-R only) word.") stemmer at http://snowball.sourceforge.net, it was originally altered from the Lingua::Stem::Snowball::Se.") (license gpl2))) + +(define-public perl-snowball-norwegian + (package + (name "perl-snowball-norwegian") + (version "1.2") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/A/AS/ASKSH/" + "Snowball-Norwegian-" version ".tar.gz")) + (sha256 + (base32 + "0675v45bbsh7vr7kpf36xs2q79g02iq1kmfw22h20xdk4rzqvkqx")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Snowball-Norwegian") + (synopsis "Porter's stemming algorithm for Norwegian") + (description "Lingua::Stem::Snowball::No is a perl port of the norwegian +stemmer at http://snowball.tartarus.org.") + (license (package-license perl)))) -- cgit 1.4.1 From 1f4b1129dcc834e98b5cb853108115da4b7fcf56 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 10:27:05 -0500 Subject: gnu: Add Snowball-Swedish. * gnu/packages/language.scm (perl-snowball-swedish): New variable. 
--- gnu/packages/language.scm | 19 +++++++++++++++++++ 1 file changed, 19 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index efc96d8830..07b16bc87e 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -248,3 +248,22 @@ Lingua::Stem::Snowball::Se.") (description "Lingua::Stem::Snowball::No is a perl port of the norwegian stemmer at http://snowball.tartarus.org.") (license (package-license perl)))) + +(define-public perl-snowball-swedish + (package + (name "perl-snowball-swedish") + (version "1.2") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/A/AS/ASKSH/" + "Snowball-Swedish-" version ".tar.gz")) + (sha256 + (base32 + "0agwc12jk5kmabnpsplw3wf4ii5w1zb159cpin44x3srb0sr5apg")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Snowball-Swedish") + (synopsis "Porter's stemming algorithm for Swedish") + (description "Lingua::Stem::Snowball::Se is a perl port of the swedish +stemmer at http://snowball.sourceforge.net.") + (license (package-license perl)))) -- cgit 1.4.1 From 2b83abae5397ddb8f790e9113207e32eb06150e2 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 10:31:00 -0500 Subject: gnu: Add Text-German. * gnu/packages/language.scm (perl-text-german): New variable. 
--- gnu/packages/language.scm | 19 +++++++++++++++++++ 1 file changed, 19 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index 07b16bc87e..b30dabc3a3 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -267,3 +267,22 @@ stemmer at http://snowball.tartarus.org.") (description "Lingua::Stem::Snowball::Se is a perl port of the swedish stemmer at http://snowball.sourceforge.net.") (license (package-license perl)))) + +(define-public perl-text-german + (package + (name "perl-text-german") + (version "0.06") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/U/UL/ULPFR/" + "Text-German-" version ".tar.gz")) + (sha256 + (base32 + "1p87pgap99lw0nv62i3ghvsi7yg90lhn8vsa3yqp75rd04clybcj")))) + (build-system perl-build-system) + (home-page "http://search.cpan.org/dist/Text-German") + (synopsis "German grundform reduction") + (description "This module is a rather incomplete implementation of work +done by Gudrun Putze-Meier.") + (license (package-license perl)))) -- cgit 1.4.1 From 9766e4fef1745d46a0b0eb6bcf35b6f3653d09f2 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 10:34:35 -0500 Subject: gnu: Add Lingua-Stem. * gnu/packages/language.scm (perl-lingua-stem): New variable. --- gnu/packages/language.scm | 28 ++++++++++++++++++++++++++++ 1 file changed, 28 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index b30dabc3a3..fff651ba2e 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -153,6 +153,34 @@ proposed in the paper A Stemming Algorithm for the Portuguese Language by Moreira, V. 
and Huyck, C.") (license (package-license perl)))) +(define-public perl-lingua-stem + (package + (name "perl-lingua-stem") + (version "0.84") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/S/SN/SNOWHARE/" + "Lingua-Stem-" version ".tar.gz")) + (sha256 + (base32 + "12avh2mnnc7llmmshrr5bgb473fvydxnlqrqbl2815mf2dp4pxcg")))) + (build-system perl-build-system) + (propagated-inputs + `(("perl-lingua-pt-stemmer" ,perl-lingua-pt-stemmer) + ("perl-lingua-stem-fr" ,perl-lingua-stem-fr) + ("perl-lingua-stem-it" ,perl-lingua-stem-it) + ("perl-lingua-stem-ru" ,perl-lingua-stem-ru) + ("perl-lingua-stem-snowball-da" ,perl-lingua-stem-snowball-da) + ("perl-snowball-norwegian" ,perl-snowball-norwegian) + ("perl-snowball-swedish" ,perl-snowball-swedish) + ("perl-text-german" ,perl-text-german))) + (home-page "http://search.cpan.org/dist/Lingua-Stem") + (synopsis "Stemming of words in various languages") + (description "This routine applies stemming algorithms to its parameters, +returning the stemmed words as appropriate to the selected locale.") + (license (package-license perl)))) + (define-public perl-lingua-stem-fr (package (name "perl-lingua-stem-fr") -- cgit 1.4.1 From d7de088395e10ec0f35584afd50bc63b3a6d18c6 Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 11:03:31 -0500 Subject: gnu: Add Lingua-EN-Tagger. * gnu/packages/language.scm (perl-lingua-en-tagger): New variable. 
--- gnu/packages/language.scm | 33 ++++++++++++++++++++++++++++++++- 1 file changed, 32 insertions(+), 1 deletion(-) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index fff651ba2e..2c080cc602 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -19,9 +19,10 @@ (define-module (gnu packages language) #:use-module (gnu packages) #:use-module (gnu packages perl) + #:use-module (gnu packages web) #:use-module (guix packages) #:use-module (guix build-system perl) - #:use-module ((guix licenses) #:select (gpl2)) + #:use-module ((guix licenses) #:select (gpl2 gpl3)) #:use-module (guix download)) (define-public perl-lingua-en-findnumber @@ -114,6 +115,36 @@ converting a word to singular or plural.") digits, is a cardinal or ordinal number.") (license (package-license perl)))) +(define-public perl-lingua-en-tagger + (package + (name "perl-lingua-en-tagger") + (version "0.24") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/A/AC/ACOBURN/" + "Lingua-EN-Tagger-" version ".tar.gz")) + (sha256 + (base32 + "0qksqh1zi8fz76a29s2ll4g6yr8y6agmzgq7ngccvgj3gza5q241")))) + (build-system perl-build-system) + (propagated-inputs + `(("perl-memoize-expirelru" ,perl-memoize-expirelru) + ("perl-lingua-stem" ,perl-lingua-stem) + ("perl-html-parser" ,perl-html-parser) + ("perl-html-tagset" ,perl-html-tagset))) + (home-page "http://search.cpan.org/dist/Lingua-EN-Tagger") + (synopsis "Part-of-speech tagger for English natural language processing") + (description "This module is a probability based, corpus-trained tagger +that assigns part-of-speech tags to English text based on a lookup dictionary +and a set of probability values. The tagger assigns appropriate tags based on +conditional probabilities - it examines the preceding tag to determine the +appropriate tag for the current word. 
Unknown words are classified according +to word morphology or can be set to be treated as nouns or other parts of +speech. The tagger also extracts as many nouns and noun phrases as it can, +using a set of regular expressions.") + (license gpl3))) + (define-public perl-lingua-en-words2nums (package (name "perl-lingua-en-words2nums") -- cgit 1.4.1 From cfed969c730d127b2bb51d2c4283e2395685ac6a Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 11:12:30 -0500 Subject: gnu: Add Lingua-EN-Inflect-Phrase. * gnu/packages/language.scm (perl-lingua-en-inflect-phrase): New variable. --- gnu/packages/language.scm | 27 +++++++++++++++++++++++++++ 1 file changed, 27 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index 2c080cc602..14958bdfbd 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -91,6 +91,33 @@ with three new functions for determining plurality of a word and forcefully converting a word to singular or plural.") (license (package-license perl)))) +(define-public perl-lingua-en-inflect-phrase + (package + (name "perl-lingua-en-inflect-phrase") + (version "0.18") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/R/RK/RKITOVER/" + "Lingua-EN-Inflect-Phrase-" version ".tar.gz")) + (sha256 + (base32 + "19prg6pkgnznrc82ymdkdi3l9schg815axjig7adca5yqa7mn2i9")))) + (build-system perl-build-system) + (native-inputs + `(("perl-test-nowarnings" ,perl-test-nowarnings))) + (propagated-inputs + `(("perl-lingua-en-findnumber" ,perl-lingua-en-findnumber) + ("perl-lingua-en-inflect" ,perl-lingua-en-inflect) + ("perl-lingua-en-inflect-number" ,perl-lingua-en-inflect-number) + ("perl-lingua-en-number-isordinal" ,perl-lingua-en-number-isordinal) + ("perl-lingua-en-tagger" ,perl-lingua-en-tagger))) + (home-page "http://search.cpan.org/dist/Lingua-EN-Inflect-Phrase") + (synopsis "Inflect short English phrases") + (description "This module 
attempts to pluralize or singularize short +English phrases.") + (license (package-license perl)))) + (define-public perl-lingua-en-number-isordinal (package (name "perl-lingua-en-number-isordinal") -- cgit 1.4.1 From f3bbbb7361f91504bc791c2c50721b8ee9f4db5a Mon Sep 17 00:00:00 2001 From: Eric Bavier Date: Tue, 17 Mar 2015 11:51:52 -0500 Subject: gnu: Add String-ToIdentifier-EN. * gnu/packages/language.scm (perl-string-toidentifier-en): New variable. --- gnu/packages/language.scm | 26 ++++++++++++++++++++++++++ 1 file changed, 26 insertions(+) (limited to 'gnu/packages/language.scm') diff --git a/gnu/packages/language.scm b/gnu/packages/language.scm index 14958bdfbd..f2f1fbc162 100644 --- a/gnu/packages/language.scm +++ b/gnu/packages/language.scm @@ -354,6 +354,32 @@ stemmer at http://snowball.tartarus.org.") stemmer at http://snowball.sourceforge.net.") (license (package-license perl)))) +(define-public perl-string-toidentifier-en + (package + (name "perl-string-toidentifier-en") + (version "0.11") + (source + (origin + (method url-fetch) + (uri (string-append "mirror://cpan/authors/id/R/RK/RKITOVER/" + "String-ToIdentifier-EN-" version ".tar.gz")) + (sha256 + (base32 + "1bawghkgkkx7j3avnrj5sg3vix1z5564ks6wf9az3jc2knh8s5nh")))) + (build-system perl-build-system) + (propagated-inputs + `(("perl-lingua-en-inflect-phrase" ,perl-lingua-en-inflect-phrase) + ("perl-text-unidecode" ,perl-text-unidecode) + ("perl-namespace-clean" ,perl-namespace-clean))) + (home-page "http://search.cpan.org/dist/String-ToIdentifier-EN") + (synopsis "Convert strings to english program identifiers") + (description "This module provides a utility method, \"to_identifier\" for +converting an arbitrary string into a readable representation using the ASCII +subset of \"\\w\" for use as an identifier in a computer program. 
The intent +is to make unique identifier names from which the content of the original +string can be easily inferred by a human just by reading the identifier.") + (license (package-license perl)))) + (define-public perl-text-german (package (name "perl-text-german") -- cgit 1.4.1