summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--var/spack/repos/builtin/packages/py-nltk/package.py177
1 files changed, 171 insertions, 6 deletions
diff --git a/var/spack/repos/builtin/packages/py-nltk/package.py b/var/spack/repos/builtin/packages/py-nltk/package.py
index 34dbc24b2f..80a3b07b5f 100644
--- a/var/spack/repos/builtin/packages/py-nltk/package.py
+++ b/var/spack/repos/builtin/packages/py-nltk/package.py
@@ -14,14 +14,19 @@ class PyNltk(PythonPackage):
homepage = "https://www.nltk.org/"
pypi = "nltk/nltk-3.5.zip"
+ version("3.8.1", sha256="1834da3d0682cba4f2cede2f9aad6b0fafb6461ba451db0efb6f9c39798d64d3")
version("3.5", sha256="845365449cd8c5f9731f7cb9f8bd6fd0767553b9d53af9eb1b3abf7700936b35")
+ maintainers("meyersbs")
+
variant("data", default=False, description="Download the NLTK data")
+ depends_on("python@3.7:", when="@3.8.1:", type=("build", "run"))
depends_on("python@3.5:", type=("build", "run"))
- depends_on("py-setuptools", type=("build", "run"))
+ depends_on("py-setuptools", type="build")
depends_on("py-joblib", type=("build", "run"))
depends_on("py-click", type=("build", "run"))
+ depends_on("py-regex@2021.8.3:", when="@3.8.1:", type=("build", "run"))
depends_on("py-regex", type=("build", "run"))
depends_on("py-tqdm", type=("build", "run"))
@@ -33,6 +38,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/misc",
placement="perluniprops",
)
+
resource(
name="mwa_ppdb",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/misc/mwa_ppdb.zip",
@@ -41,14 +47,16 @@ class PyNltk(PythonPackage):
destination="nltk_data/misc",
placement="mwa_ppdb",
)
+
resource(
name="punkt",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/tokenizers/punkt.zip",
when="+data",
- sha256="9a74e3cc0057021b12984c07cc5e46cb746385cf90f49b7d6fe806fb71610144",
+ sha256="51c3078994aeaf650bfc8e028be4fb42b4a0d177d41c012b6a983979653660ec",
destination="nltk_data/tokenizers",
placement="punkt",
)
+
resource(
name="rslp",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/stemmers/rslp.zip",
@@ -57,6 +65,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/stemmers",
placement="rslp",
)
+
resource(
name="porter_test",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/stemmers/porter_test.zip",
@@ -65,6 +74,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/stemmers",
placement="porter_test",
)
+
resource(
name="snowball_data",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/stemmers/snowball_data.zip",
@@ -73,6 +83,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/stemmers",
placement="snowball_data",
)
+
resource(
name="maxent_ne_chunker",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/chunkers/maxent_ne_chunker.zip",
@@ -81,6 +92,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/chunkers",
placement="maxent_ne_chunker",
)
+
resource(
name="moses_sample",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/models/moses_sample.zip",
@@ -89,6 +101,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/models",
placement="moses_sample",
)
+
resource(
name="bllip_wsj_no_aux",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/models/bllip_wsj_no_aux.zip",
@@ -97,6 +110,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/models",
placement="bllip_wsj_no_aux",
)
+
resource(
name="word2vec_sample",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/models/word2vec_sample.zip",
@@ -105,6 +119,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/models",
placement="word2vec_sample",
)
+
resource(
name="wmt15_eval",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/models/wmt15_eval.zip",
@@ -113,6 +128,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/models",
placement="wmt15_eval",
)
+
resource(
name="spanish_grammars",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/grammars/spanish_grammars.zip",
@@ -121,6 +137,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/grammars",
placement="spanish_grammars",
)
+
resource(
name="sample_grammars",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/grammars/sample_grammars.zip",
@@ -129,6 +146,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/grammars",
placement="sample_grammars",
)
+
resource(
name="large_grammars",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/grammars/large_grammars.zip",
@@ -137,6 +155,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/grammars",
placement="large_grammars",
)
+
resource(
name="book_grammars",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/grammars/book_grammars.zip",
@@ -145,6 +164,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/grammars",
placement="book_grammars",
)
+
resource(
name="basque_grammars",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/grammars/basque_grammars.zip",
@@ -153,6 +173,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/grammars",
placement="basque_grammars",
)
+
resource(
name="maxent_treebank_pos_tagger",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/taggers/maxent_treebank_pos_tagger.zip",
@@ -161,6 +182,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/taggers",
placement="maxent_treebank_pos_tagger",
)
+
resource(
name="averaged_perceptron_tagger",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/taggers/averaged_perceptron_tagger.zip",
@@ -169,6 +191,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/taggers",
placement="averaged_perceptron_tagger",
)
+
resource(
name="averaged_perceptron_tagger_ru",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/taggers/averaged_perceptron_tagger_ru.zip",
@@ -177,14 +200,16 @@ class PyNltk(PythonPackage):
destination="nltk_data/taggers",
placement="averaged_perceptron_tagger_ru",
)
+
resource(
name="universal_tagset",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/taggers/universal_tagset.zip",
when="+data",
- sha256="fb3b295a7b636d3f50e2bd3f9bd4c84eb99eaf36ff475ea406bdecd247f8f962",
+ sha256="d490e1ae8f5625dcdfdda04be15c22a2aade8c2561a36a61edcdf0c7d6aa8352",
destination="nltk_data/taggers",
placement="universal_tagset",
)
+
resource(
name="vader_lexicon",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/sentiment/vader_lexicon.zip",
@@ -193,6 +218,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/sentiment",
placement="vader_lexicon",
)
+
resource(
name="lin_thesaurus",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/lin_thesaurus.zip",
@@ -201,6 +227,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="lin_thesaurus",
)
+
resource(
name="movie_reviews",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/movie_reviews.zip",
@@ -209,6 +236,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="movie_reviews",
)
+
resource(
name="problem_reports",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/problem_reports.zip",
@@ -217,6 +245,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="problem_reports",
)
+
resource(
name="pros_cons",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/pros_cons.zip",
@@ -225,6 +254,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="pros_cons",
)
+
resource(
name="masc_tagged",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/masc_tagged.zip",
@@ -233,6 +263,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="masc_tagged",
)
+
resource(
name="sentence_polarity",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/sentence_polarity.zip",
@@ -241,6 +272,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="sentence_polarity",
)
+
resource(
name="webtext",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/webtext.zip",
@@ -249,6 +281,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="webtext",
)
+
resource(
name="nps_chat",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/nps_chat.zip",
@@ -257,6 +290,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="nps_chat",
)
+
resource(
name="city_database",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/city_database.zip",
@@ -265,6 +299,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="city_database",
)
+
resource(
name="europarl_raw",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/europarl_raw.zip",
@@ -273,6 +308,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="europarl_raw",
)
+
resource(
name="biocreative_ppi",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/biocreative_ppi.zip",
@@ -281,6 +317,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="biocreative_ppi",
)
+
resource(
name="verbnet3",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/verbnet3.zip",
@@ -289,6 +326,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="verbnet3",
)
+
resource(
name="pe08",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/pe08.zip",
@@ -297,6 +335,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="pe08",
)
+
resource(
name="pil",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/pil.zip",
@@ -305,6 +344,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="pil",
)
+
resource(
name="crubadan",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/crubadan.zip",
@@ -313,6 +353,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="crubadan",
)
+
resource(
name="gutenberg",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/gutenberg.zip",
@@ -321,6 +362,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="gutenberg",
)
+
resource(
name="propbank",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/propbank.zip",
@@ -329,6 +371,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="propbank",
)
+
resource(
name="machado",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/machado.zip",
@@ -337,6 +380,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="machado",
)
+
resource(
name="state_union",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/state_union.zip",
@@ -345,6 +389,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="state_union",
)
+
resource(
name="twitter_samples",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/twitter_samples.zip",
@@ -353,6 +398,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="twitter_samples",
)
+
resource(
name="semcor",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/semcor.zip",
@@ -361,6 +407,25 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="semcor",
)
+
+ resource(
+ name="wordnet31",
+ url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/wordnet31.zip",
+ when="+data",
+ sha256="2a9e7da7d0c17ad875e4171a4d28ae17ab6969c7d67f1cf0f59d65c66d0fdd37",
+ destination="nltk_data/corpora",
+ placement="wordnet31",
+ )
+
+ resource(
+ name="extended_omw",
+ url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/extended_omw.zip",
+ when="+data",
+ sha256="c59b90f2902c351eeb0ce97a49a1b7cf73d4e2f5b05cbda0e903eb20b5ee168a",
+ destination="nltk_data/corpora",
+ placement="extended_omw",
+ )
+
resource(
name="names",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/names.zip",
@@ -369,6 +434,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="names",
)
+
resource(
name="ptb",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/ptb.zip",
@@ -377,6 +443,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="ptb",
)
+
resource(
name="nombank.1.0",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/nombank.1.0.zip",
@@ -385,6 +452,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="nombank.1.0",
)
+
resource(
name="floresta",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/floresta.zip",
@@ -393,6 +461,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="floresta",
)
+
resource(
name="comtrans",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/comtrans.zip",
@@ -401,6 +470,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="comtrans",
)
+
resource(
name="knbc",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/knbc.zip",
@@ -409,6 +479,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="knbc",
)
+
resource(
name="mac_morpho",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/mac_morpho.zip",
@@ -417,6 +488,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="mac_morpho",
)
+
resource(
name="swadesh",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/swadesh.zip",
@@ -425,6 +497,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="swadesh",
)
+
resource(
name="rte",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/rte.zip",
@@ -433,6 +506,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="rte",
)
+
resource(
name="toolbox",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/toolbox.zip",
@@ -441,6 +515,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="toolbox",
)
+
resource(
name="jeita",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/jeita.zip",
@@ -449,6 +524,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="jeita",
)
+
resource(
name="product_reviews_1",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/product_reviews_1.zip",
@@ -457,6 +533,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="product_reviews_1",
)
+
resource(
name="omw",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/omw.zip",
@@ -465,6 +542,16 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="omw",
)
+
+ resource(
+ name="wordnet2022",
+ url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/wordnet2022.zip",
+ when="+data",
+ sha256="5ccbb3382b9d147d4acac12645b3d6f375d1f5e4cd037fedadef74d069a8ee3f",
+ destination="nltk_data/corpora",
+ placement="wordnet2022",
+ )
+
resource(
name="sentiwordnet",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/sentiwordnet.zip",
@@ -473,6 +560,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="sentiwordnet",
)
+
resource(
name="product_reviews_2",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/product_reviews_2.zip",
@@ -481,6 +569,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="product_reviews_2",
)
+
resource(
name="abc",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/abc.zip",
@@ -489,6 +578,16 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="abc",
)
+
+ resource(
+ name="wordnet2021",
+ url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/wordnet2021.zip",
+ when="+data",
+ sha256="d7ef7d289da4dd0f33f07d9745856adc74689a53a8fa9be5dcfd3c87c5da24db",
+ destination="nltk_data/corpora",
+ placement="wordnet2021",
+ )
+
resource(
name="udhr2",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/udhr2.zip",
@@ -497,6 +596,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="udhr2",
)
+
resource(
name="senseval",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/senseval.zip",
@@ -505,6 +605,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="senseval",
)
+
resource(
name="words",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/words.zip",
@@ -513,6 +614,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="words",
)
+
resource(
name="framenet_v15",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/framenet_v15.zip",
@@ -521,6 +623,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="framenet_v15",
)
+
resource(
name="unicode_samples",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/unicode_samples.zip",
@@ -529,6 +632,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="unicode_samples",
)
+
resource(
name="kimmo",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/kimmo.zip",
@@ -537,6 +641,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="kimmo",
)
+
resource(
name="framenet_v17",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/framenet_v17.zip",
@@ -545,6 +650,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="framenet_v17",
)
+
resource(
name="chat80",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/chat80.zip",
@@ -553,6 +659,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="chat80",
)
+
resource(
name="qc",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/qc.zip",
@@ -561,14 +668,16 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="qc",
)
+
resource(
name="inaugural",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/inaugural.zip",
when="+data",
- sha256="a6c099af7f5b5ad2a03f1e4ea3f5ff7699779b9d4327152110af462da210bd1f",
+ sha256="7c5fb5793e31fbeae12bf1aa0ffda5336468f07cedb50654c6d31ca384e2046b",
destination="nltk_data/corpora",
placement="inaugural",
)
+
resource(
name="wordnet",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/wordnet.zip",
@@ -577,14 +686,16 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="wordnet",
)
+
resource(
name="stopwords",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/stopwords.zip",
when="+data",
- sha256="3fc8d3d4c6e3d5ba6e23a66920dd3fde611cc3edf6e1fd80159a7965f47bea09",
+ sha256="15c94179887425ca1bedc265608cab9f27d650211f709bb929e320990a4b01d1",
destination="nltk_data/corpora",
placement="stopwords",
)
+
resource(
name="verbnet",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/verbnet.zip",
@@ -593,6 +704,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="verbnet",
)
+
resource(
name="shakespeare",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/shakespeare.zip",
@@ -601,6 +713,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="shakespeare",
)
+
resource(
name="ycoe",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/ycoe.zip",
@@ -609,6 +722,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="ycoe",
)
+
resource(
name="ieer",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/ieer.zip",
@@ -617,6 +731,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="ieer",
)
+
resource(
name="cess_cat",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/cess_cat.zip",
@@ -625,6 +740,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="cess_cat",
)
+
resource(
name="switchboard",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/switchboard.zip",
@@ -633,6 +749,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="switchboard",
)
+
resource(
name="comparative_sentences",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/comparative_sentences.zip",
@@ -641,6 +758,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="comparative_sentences",
)
+
resource(
name="subjectivity",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/subjectivity.zip",
@@ -649,6 +767,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="subjectivity",
)
+
resource(
name="udhr",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/udhr.zip",
@@ -657,6 +776,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="udhr",
)
+
resource(
name="pl196x",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/pl196x.zip",
@@ -665,6 +785,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="pl196x",
)
+
resource(
name="paradigms",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/paradigms.zip",
@@ -673,6 +794,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="paradigms",
)
+
resource(
name="gazetteers",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/gazetteers.zip",
@@ -681,6 +803,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="gazetteers",
)
+
resource(
name="timit",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/timit.zip",
@@ -689,6 +812,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="timit",
)
+
resource(
name="treebank",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/treebank.zip",
@@ -697,14 +821,16 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="treebank",
)
+
resource(
name="sinica_treebank",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/sinica_treebank.zip",
when="+data",
- sha256="5506ddf646d5c3fb0a5fffdb53330ec8465f6468499f08d86f77d2df01d5b35e",
+ sha256="395958a28f06d92ce1de0f0cf1bb17dc4a5cc882d27487447252ad615641e9ba",
destination="nltk_data/corpora",
placement="sinica_treebank",
)
+
resource(
name="opinion_lexicon",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/opinion_lexicon.zip",
@@ -713,6 +839,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="opinion_lexicon",
)
+
resource(
name="ppattach",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/ppattach.zip",
@@ -721,6 +848,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="ppattach",
)
+
resource(
name="dependency_treebank",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/dependency_treebank.zip",
@@ -729,6 +857,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="dependency_treebank",
)
+
resource(
name="reuters",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/reuters.zip",
@@ -737,6 +866,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="reuters",
)
+
resource(
name="genesis",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/genesis.zip",
@@ -745,6 +875,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="genesis",
)
+
resource(
name="cess_esp",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/cess_esp.zip",
@@ -753,6 +884,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="cess_esp",
)
+
resource(
name="conll2007",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/conll2007.zip",
@@ -761,6 +893,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="conll2007",
)
+
resource(
name="nonbreaking_prefixes",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/nonbreaking_prefixes.zip",
@@ -769,6 +902,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="nonbreaking_prefixes",
)
+
resource(
name="dolch",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/dolch.zip",
@@ -777,6 +911,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="dolch",
)
+
resource(
name="smultron",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/smultron.zip",
@@ -785,6 +920,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="smultron",
)
+
resource(
name="alpino",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/alpino.zip",
@@ -793,6 +929,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="alpino",
)
+
resource(
name="wordnet_ic",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/wordnet_ic.zip",
@@ -801,6 +938,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="wordnet_ic",
)
+
resource(
name="brown",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/brown.zip",
@@ -809,6 +947,16 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="brown",
)
+
+ resource(
+ name="bcp47",
+ url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/bcp47.zip",
+ when="+data",
+ sha256="435d986fd9de0ae540a34e0978dbbaf5d1db7576b2bc7571da71cf6a01c8dfaa",
+ destination="nltk_data/corpora",
+ placement="bcp47",
+ )
+
resource(
name="panlex_swadesh",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/panlex_swadesh.zip",
@@ -817,6 +965,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="panlex_swadesh",
)
+
resource(
name="conll2000",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/conll2000.zip",
@@ -825,6 +974,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="conll2000",
)
+
resource(
name="universal_treebanks_v20",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/universal_treebanks_v20.zip",
@@ -833,6 +983,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="universal_treebanks_v20",
)
+
resource(
name="brown_tei",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/brown_tei.zip",
@@ -841,6 +992,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="brown_tei",
)
+
resource(
name="cmudict",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/cmudict.zip",
@@ -849,6 +1001,16 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="cmudict",
)
+
+ resource(
+ name="omw-1.4",
+ url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/omw-1.4.zip",
+ when="+data",
+ sha256="3b941e664852f3297b6040236626065796a2aaf7d7f9eec8779a3beaa1096c2d",
+ destination="nltk_data/corpora",
+ placement="omw-1.4",
+ )
+
resource(
name="mte_teip5",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/mte_teip5.zip",
@@ -857,6 +1019,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="mte_teip5",
)
+
resource(
name="indian",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/indian.zip",
@@ -865,6 +1028,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="indian",
)
+
resource(
name="conll2002",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/corpora/conll2002.zip",
@@ -873,6 +1037,7 @@ class PyNltk(PythonPackage):
destination="nltk_data/corpora",
placement="conll2002",
)
+
resource(
name="tagsets",
url="https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/help/tagsets.zip",