summary | refs | log | tree | commit | diff
path: root/textproc
diff options
context:
space:
mode:
author: adam <adam@pkgsrc.org> 2022-12-15 23:15:24 +0000
committer: adam <adam@pkgsrc.org> 2022-12-15 23:15:24 +0000
commit: 151404e9e5f53f230effab89df5cb5272d8bcb03 (patch)
tree: 5b7a081a3374c7737c25d30a17e581a98aca9394 /textproc
parent: 4f717ab85bcd60304301c8206e7815b7d309c8f0 (diff)
download: pkgsrc-151404e9e5f53f230effab89df5cb5272d8bcb03.tar.gz
py-nltk: updated to 3.8
Version 3.8 2022-12-12
* Refactor dispersion plot
* Provide type hints for LazyCorpusLoader variables
* Throw warning when LanguageModel is initialized with incorrect vocabulary
* Fix WordNet's all_synsets() function
* Resolve TreebankWordDetokenizer inconsistency with end-of-string contractions
* Support both iso639-3 codes and BCP-47 language tags
* Avoid DeprecationWarning in Regexp tokenizer
* Fix many doctests, add doctests to CI
* Fix bool field not being read in VerbNet
* Greatly improve time efficiency of SyllableTokenizer when tokenizing numbers
* Fix encodings of Polish udhr corpus reader
* Allow TweetTokenizer to tokenize emoji flag sequences
* Prevent LazyModule from increasing the size of nltk.__dict__
* Fix CoreNLPServer non-default port issue
* Add "acion" suffix to the Spanish SnowballStemmer
* Allow loading WordNet without OMW
* Use input() in nltk.chat.chatbot() for Jupyter support
* Fix edit_distance_align() in distance.py
* Tackle performance and accuracy regression of sentence tokenizer since NLTK 3.6.6
* Add the Iota operator to semantic logic
* Resolve critical errors in WordNet app
* Resolve critical error in CHILDES Corpus
* Make WordNet information_content() accept adjective satellites
* Add "strict=True" parameter to CoreNLP
* Resolve issue with WordNet's synset_from_sense_key
* Handle WordNet synsets that were lost in mapping
* Resolve TypeError in Boxer
* Add function to retrieve WordNet synonyms
* Warn about nonexistent OMW offsets instead of raising an error
* Fix missing ic argument in res, jcn and lin similarity functions of WordNet
* Add support for the extended OMW
* Fix LC cutoff policy of text tiling
* Optimize ConditionalFreqDist.__add__ performance
* Add Markdown corpus reader
Diffstat (limited to 'textproc')
-rw-r--r--  textproc/py-nltk/Makefile   4
-rw-r--r--  textproc/py-nltk/PLIST     23
-rw-r--r--  textproc/py-nltk/distinfo   8
3 files changed, 19 insertions, 16 deletions
diff --git a/textproc/py-nltk/Makefile b/textproc/py-nltk/Makefile
index f87b5f01105..2de9d5a38e7 100644
--- a/textproc/py-nltk/Makefile
+++ b/textproc/py-nltk/Makefile
@@ -1,6 +1,6 @@
-# $NetBSD: Makefile,v 1.8 2022/11/29 17:09:45 adam Exp $
+# $NetBSD: Makefile,v 1.9 2022/12/15 23:15:24 adam Exp $
-DISTNAME= nltk-3.7
+DISTNAME= nltk-3.8
PKGNAME= ${PYPKGPREFIX}-${DISTNAME}
CATEGORIES= textproc python
MASTER_SITES= ${MASTER_SITE_PYPI:=n/nltk/}
diff --git a/textproc/py-nltk/PLIST b/textproc/py-nltk/PLIST
index 640f2698034..5e475fdd71e 100644
--- a/textproc/py-nltk/PLIST
+++ b/textproc/py-nltk/PLIST
@@ -1,4 +1,4 @@
-@comment $NetBSD: PLIST,v 1.4 2022/11/29 17:09:45 adam Exp $
+@comment $NetBSD: PLIST,v 1.5 2022/12/15 23:15:24 adam Exp $
bin/nltk-${PYVERSSUFFIX}
${PYSITELIB}/${EGG_INFODIR}/PKG-INFO
${PYSITELIB}/${EGG_INFODIR}/SOURCES.txt
@@ -188,6 +188,9 @@ ${PYSITELIB}/nltk/corpus/reader/aligned.pyo
${PYSITELIB}/nltk/corpus/reader/api.py
${PYSITELIB}/nltk/corpus/reader/api.pyc
${PYSITELIB}/nltk/corpus/reader/api.pyo
+${PYSITELIB}/nltk/corpus/reader/bcp47.py
+${PYSITELIB}/nltk/corpus/reader/bcp47.pyc
+${PYSITELIB}/nltk/corpus/reader/bcp47.pyo
${PYSITELIB}/nltk/corpus/reader/bnc.py
${PYSITELIB}/nltk/corpus/reader/bnc.pyc
${PYSITELIB}/nltk/corpus/reader/bnc.pyo
@@ -239,6 +242,9 @@ ${PYSITELIB}/nltk/corpus/reader/knbc.pyo
${PYSITELIB}/nltk/corpus/reader/lin.py
${PYSITELIB}/nltk/corpus/reader/lin.pyc
${PYSITELIB}/nltk/corpus/reader/lin.pyo
+${PYSITELIB}/nltk/corpus/reader/markdown.py
+${PYSITELIB}/nltk/corpus/reader/markdown.pyc
+${PYSITELIB}/nltk/corpus/reader/markdown.pyo
${PYSITELIB}/nltk/corpus/reader/mte.py
${PYSITELIB}/nltk/corpus/reader/mte.pyc
${PYSITELIB}/nltk/corpus/reader/mte.pyo
@@ -401,6 +407,9 @@ ${PYSITELIB}/nltk/internals.pyo
${PYSITELIB}/nltk/jsontags.py
${PYSITELIB}/nltk/jsontags.pyc
${PYSITELIB}/nltk/jsontags.pyo
+${PYSITELIB}/nltk/langnames.py
+${PYSITELIB}/nltk/langnames.pyc
+${PYSITELIB}/nltk/langnames.pyo
${PYSITELIB}/nltk/lazyimport.py
${PYSITELIB}/nltk/lazyimport.pyc
${PYSITELIB}/nltk/lazyimport.pyo
@@ -729,9 +738,6 @@ ${PYSITELIB}/nltk/test/crubadan.doctest
${PYSITELIB}/nltk/test/data.doctest
${PYSITELIB}/nltk/test/dependency.doctest
${PYSITELIB}/nltk/test/discourse.doctest
-${PYSITELIB}/nltk/test/discourse_fixt.py
-${PYSITELIB}/nltk/test/discourse_fixt.pyc
-${PYSITELIB}/nltk/test/discourse_fixt.pyo
${PYSITELIB}/nltk/test/drt.doctest
${PYSITELIB}/nltk/test/featgram.doctest
${PYSITELIB}/nltk/test/featstruct.doctest
@@ -750,9 +756,6 @@ ${PYSITELIB}/nltk/test/grammar.doctest
${PYSITELIB}/nltk/test/grammartestsuites.doctest
${PYSITELIB}/nltk/test/index.doctest
${PYSITELIB}/nltk/test/inference.doctest
-${PYSITELIB}/nltk/test/inference_fixt.py
-${PYSITELIB}/nltk/test/inference_fixt.pyc
-${PYSITELIB}/nltk/test/inference_fixt.pyo
${PYSITELIB}/nltk/test/internals.doctest
${PYSITELIB}/nltk/test/japanese.doctest
${PYSITELIB}/nltk/test/lm.doctest
@@ -761,9 +764,6 @@ ${PYSITELIB}/nltk/test/meteor.doctest
${PYSITELIB}/nltk/test/metrics.doctest
${PYSITELIB}/nltk/test/misc.doctest
${PYSITELIB}/nltk/test/nonmonotonic.doctest
-${PYSITELIB}/nltk/test/nonmonotonic_fixt.py
-${PYSITELIB}/nltk/test/nonmonotonic_fixt.pyc
-${PYSITELIB}/nltk/test/nonmonotonic_fixt.pyo
${PYSITELIB}/nltk/test/paice.doctest
${PYSITELIB}/nltk/test/parse.doctest
${PYSITELIB}/nltk/test/portuguese_en.doctest
@@ -780,6 +780,9 @@ ${PYSITELIB}/nltk/test/resolution.doctest
${PYSITELIB}/nltk/test/semantics.doctest
${PYSITELIB}/nltk/test/sentiment.doctest
${PYSITELIB}/nltk/test/sentiwordnet.doctest
+${PYSITELIB}/nltk/test/setup_fixt.py
+${PYSITELIB}/nltk/test/setup_fixt.pyc
+${PYSITELIB}/nltk/test/setup_fixt.pyo
${PYSITELIB}/nltk/test/simple.doctest
${PYSITELIB}/nltk/test/stem.doctest
${PYSITELIB}/nltk/test/tag.doctest
diff --git a/textproc/py-nltk/distinfo b/textproc/py-nltk/distinfo
index 36742dfe78e..7f1e77fad4f 100644
--- a/textproc/py-nltk/distinfo
+++ b/textproc/py-nltk/distinfo
@@ -1,5 +1,5 @@
-$NetBSD: distinfo,v 1.6 2022/11/29 17:09:45 adam Exp $
+$NetBSD: distinfo,v 1.7 2022/12/15 23:15:24 adam Exp $
-BLAKE2s (nltk-3.7.zip) = 28c8e1bb3b834d1460e41e967473b89641fddc6db6b890e292a1ba8aa60519ee
-SHA512 (nltk-3.7.zip) = 8abe2d11875f769a4d23190b8da5807ee6a924fd5e07bfeb545f1a6e191eb1f49d02cbd80330f4261330598dd0936430c68513291f6e49fc275047c93e7f430a
-Size (nltk-3.7.zip) = 3293449 bytes
+BLAKE2s (nltk-3.8.zip) = abd3408550c17141c5ad16b590b26a84196d7a0c33d9ddcff77ef4eff0816e94
+SHA512 (nltk-3.8.zip) = 94ce94a0a5fc353e1802758b30c095d03dda044b337072e29ed0b17de509c0c3902b13bef7177adef1f0cbf57cd629ac9f8b1a242edcd3f3b4d206990b3cdcf8
+Size (nltk-3.8.zip) = 4619825 bytes