forked from pool/python-nltk
Accepting request 1160467 from home:bnavigator:branches:devel:languages:python
- Update to 3.8.1
  * Resolve RCE & XSS vulnerabilities in localhost WordNet Browser
  * Add Python 3.11 support
- Update nltk_data archive
- Drop port-2to3.patch
- Add nltk-pr3207-py312.patch for Python 3.12 support
  * gh#nltk/nltk#3207

OBS-URL: https://build.opensuse.org/request/show/1160467
OBS-URL: https://build.opensuse.org/package/show/devel:languages:python/python-nltk?expand=0&rev=45
This commit is contained in:
parent
3547d0cab5
commit
f64d1a206e
3
nltk-3.8.1.zip
Normal file
3
nltk-3.8.1.zip
Normal file
@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:1834da3d0682cba4f2cede2f9aad6b0fafb6461ba451db0efb6f9c39798d64d3
|
||||||
|
size 4620388
|
@ -1,3 +0,0 @@
|
|||||||
version https://git-lfs.github.com/spec/v1
|
|
||||||
oid sha256:74b30826a37d78d53427105bbd037dd880251be269fca64ee530838a46ed55fc
|
|
||||||
size 4619825
|
|
1782
nltk-pr3207-py312.patch
Normal file
1782
nltk-pr3207-py312.patch
Normal file
File diff suppressed because it is too large
Load Diff
@ -1,3 +1,3 @@
|
|||||||
version https://git-lfs.github.com/spec/v1
|
version https://git-lfs.github.com/spec/v1
|
||||||
oid sha256:f41383a4774bf7227f4563f46543460ba07a6921f7bcc6185519e87ea9e4323f
|
oid sha256:f79462ac99f414b4850943720bed4a59c1bb15bfc8f1ce16b26165da6db07680
|
||||||
size 453871052
|
size 393271816
|
||||||
|
@ -1,48 +0,0 @@
|
|||||||
---
|
|
||||||
nltk_data/corpora/pl196x/splitter.py | 4 ++--
|
|
||||||
nltk_data/taggers/universal_tagset/universal_tags.py | 5 -----
|
|
||||||
tools/find_deprecated.py | 2 +-
|
|
||||||
3 files changed, 3 insertions(+), 8 deletions(-)
|
|
||||||
|
|
||||||
--- a/nltk_data/corpora/pl196x/splitter.py
|
|
||||||
+++ b/nltk_data/corpora/pl196x/splitter.py
|
|
||||||
@@ -1,4 +1,4 @@
|
|
||||||
-#!/usr/bin/python
|
|
||||||
+#!/usr/bin/python3
|
|
||||||
|
|
||||||
import sys, re
|
|
||||||
|
|
||||||
@@ -7,7 +7,7 @@ TEXTID = re.compile(r'<text id="(.*)">')
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
|
||||||
if len(sys.argv) != 2:
|
|
||||||
- print 'One argument required: a pl196x corpus to split.'
|
|
||||||
+ print('One argument required: a pl196x corpus to split.')
|
|
||||||
sys.exit()
|
|
||||||
|
|
||||||
inputFileName = sys.argv[1]
|
|
||||||
--- a/nltk_data/taggers/universal_tagset/universal_tags.py
|
|
||||||
+++ b/nltk_data/taggers/universal_tagset/universal_tags.py
|
|
||||||
@@ -22,11 +22,6 @@ X - other: foreign words, typos, abbrevi
|
|
||||||
@author: Nathan Schneider (nschneid)
|
|
||||||
@since: 2011-05-06
|
|
||||||
'''
|
|
||||||
-
|
|
||||||
-# Strive towards Python 3 compatibility
|
|
||||||
-from __future__ import print_function, unicode_literals, division
|
|
||||||
-from future_builtins import map, filter
|
|
||||||
-
|
|
||||||
import re, glob
|
|
||||||
from collections import defaultdict
|
|
||||||
|
|
||||||
--- a/tools/find_deprecated.py
|
|
||||||
+++ b/tools/find_deprecated.py
|
|
||||||
@@ -29,7 +29,7 @@ import textwrap
|
|
||||||
import tokenize
|
|
||||||
from doctest import DocTestParser, register_optionflag
|
|
||||||
|
|
||||||
-from cStringIO import StringIO
|
|
||||||
+from io import StringIO
|
|
||||||
|
|
||||||
import nltk.corpus
|
|
||||||
from nltk import defaultdict
|
|
@ -1,3 +1,14 @@
|
|||||||
|
-------------------------------------------------------------------
|
||||||
|
Thu Mar 21 17:41:52 UTC 2024 - Ben Greiner <code@bnavigator.de>
|
||||||
|
|
||||||
|
- Update to 3.8.1
|
||||||
|
* Resolve RCE & XSS vulnerabilities in localhost WordNet Browser
|
||||||
|
* Add Python 3.11 support
|
||||||
|
- Update nltk_data archive
|
||||||
|
- Drop port-2to3.patch
|
||||||
|
- Add nltk-pr3207-py312.patch for Python 3.12 support
|
||||||
|
* gh#nltk/nltk#3207
|
||||||
|
|
||||||
-------------------------------------------------------------------
|
-------------------------------------------------------------------
|
||||||
Tue Mar 28 08:36:04 UTC 2023 - pgajdos@suse.com
|
Tue Mar 28 08:36:04 UTC 2023 - pgajdos@suse.com
|
||||||
|
|
||||||
|
@ -1 +1,2 @@
|
|||||||
addFilter("E: zero-length /usr/lib/python3\.\d/site-packages/nltk/tbl/api\.py")
|
addFilter("E: zero-length /usr/lib/python3\.\d+/site-packages/nltk/tbl/api\.py")
|
||||||
|
addFilter("explicit-lib-dependency python3\d*-joblib")
|
||||||
|
@ -1,7 +1,7 @@
|
|||||||
#
|
#
|
||||||
# spec file for package python-nltk
|
# spec file for package python-nltk
|
||||||
#
|
#
|
||||||
# Copyright (c) 2023 SUSE LLC
|
# Copyright (c) 2024 SUSE LLC
|
||||||
#
|
#
|
||||||
# All modifications and additions to the file contributed by third parties
|
# All modifications and additions to the file contributed by third parties
|
||||||
# remain the property of their copyright owners, unless otherwise agreed
|
# remain the property of their copyright owners, unless otherwise agreed
|
||||||
@ -16,55 +16,86 @@
|
|||||||
#
|
#
|
||||||
|
|
||||||
|
|
||||||
%{!?python_module:%define python_module() python-%{**} python3-%{**}}
|
|
||||||
%define pyname nltk
|
|
||||||
%define skip_python2 1
|
|
||||||
Name: python-nltk
|
Name: python-nltk
|
||||||
Version: 3.8
|
Version: 3.8.1
|
||||||
Release: 0
|
Release: 0
|
||||||
Summary: Natural Language Toolkit
|
Summary: Natural Language Toolkit
|
||||||
License: Apache-2.0
|
License: Apache-2.0
|
||||||
URL: http://nltk.org/
|
URL: http://nltk.org/
|
||||||
Source0: https://files.pythonhosted.org/packages/source/n/nltk/%{pyname}-%{version}.zip
|
# SourceRepository: https://github.com/nltk/nltk
|
||||||
# Downloaded NLTK data via python3 -m nltk.downloader,
|
Source0: https://files.pythonhosted.org/packages/source/n/nltk/nltk-%{version}.zip
|
||||||
# then unzip downloaded zip archive.
|
# Download/Update NLTK data:
|
||||||
|
# quilt setup python-nltk.spec
|
||||||
|
# pushd nltk-?.?.?
|
||||||
|
# python3 -m nltk.downloader -d nltk_data tests \
|
||||||
|
# averaged_perceptron_tagger_ru \
|
||||||
|
# brown \
|
||||||
|
# cess_cat \
|
||||||
|
# cess_esp \
|
||||||
|
# conll2007 \
|
||||||
|
# floresta \
|
||||||
|
# gutenberg \
|
||||||
|
# inaugural \
|
||||||
|
# indian \
|
||||||
|
# large_grammars \
|
||||||
|
# nombank.1.0 \
|
||||||
|
# omw-1.4 \
|
||||||
|
# pl196x \
|
||||||
|
# ptb \
|
||||||
|
# punkt \
|
||||||
|
# rte \
|
||||||
|
# sinica_treebank \
|
||||||
|
# stopwords \
|
||||||
|
# treebank \
|
||||||
|
# udhr \
|
||||||
|
# universal_tagset \
|
||||||
|
# wordnet \
|
||||||
|
# wordnet_ic \
|
||||||
|
# words
|
||||||
|
# tar -cJf ../nltk_data.tar.xz nltk_data
|
||||||
|
# popd
|
||||||
# see https://www.nltk.org/data.html for more details
|
# see https://www.nltk.org/data.html for more details
|
||||||
Source1: nltk_data.tar.xz
|
Source1: nltk_data.tar.xz
|
||||||
Source99: python-nltk.rpmlintrc
|
Source99: python-nltk.rpmlintrc
|
||||||
# PATCH-FIX-UPSTREAM skip-networked-test.patch gh#nltk/nltk#2969 mcepl@suse.com
|
# PATCH-FIX-UPSTREAM skip-networked-test.patch gh#nltk/nltk#2969 mcepl@suse.com
|
||||||
# skip tests requiring network connection
|
# skip tests requiring network connection
|
||||||
Patch0: skip-networked-test.patch
|
Patch0: skip-networked-test.patch
|
||||||
# PATCH-FIX-UPSTREAM port-2to3.patch bsc#[0-9]+ mcepl@suse.com
|
# PATCH-FIX-UPSTREAM nltk-pr3207-py312.patch gh#nltk/nltk#3207
|
||||||
# port scripts in nltk_data to Python 3
|
Patch1: nltk-pr3207-py312.patch
|
||||||
Patch1: port-2to3.patch
|
BuildRequires: %{python_module base >= 3.7}
|
||||||
BuildRequires: %{python_module regex}
|
BuildRequires: %{python_module pip}
|
||||||
BuildRequires: %{python_module setuptools}
|
BuildRequires: %{python_module setuptools}
|
||||||
|
BuildRequires: %{python_module wheel}
|
||||||
BuildRequires: %{pythons}
|
BuildRequires: %{pythons}
|
||||||
BuildRequires: fdupes
|
BuildRequires: fdupes
|
||||||
BuildRequires: python-rpm-macros
|
BuildRequires: python-rpm-macros
|
||||||
BuildRequires: unzip
|
BuildRequires: unzip
|
||||||
# For testing
|
# SECTION runtime
|
||||||
BuildRequires: %{python_module tk}
|
BuildRequires: %{python_module regex >= 2021.8.3}
|
||||||
BuildRequires: %{python_module click}
|
BuildRequires: %{python_module click}
|
||||||
BuildRequires: %{python_module pytest}
|
|
||||||
# BuildRequires: %%{python_module gensim}
|
|
||||||
BuildRequires: %{python_module joblib}
|
BuildRequires: %{python_module joblib}
|
||||||
|
BuildRequires: %{python_module tqdm}
|
||||||
|
# /SECTION
|
||||||
|
# SECTION test
|
||||||
|
BuildRequires: %{python_module tk}
|
||||||
BuildRequires: %{python_module Jinja2}
|
BuildRequires: %{python_module Jinja2}
|
||||||
BuildRequires: %{python_module matplotlib}
|
BuildRequires: %{python_module matplotlib}
|
||||||
BuildRequires: %{python_module numpy}
|
BuildRequires: %{python_module numpy}
|
||||||
BuildRequires: %{python_module pyparsing}
|
BuildRequires: %{python_module pyparsing}
|
||||||
BuildRequires: %{python_module pytest-cov}
|
BuildRequires: %{python_module pytest-cov}
|
||||||
BuildRequires: %{python_module pytest-mock}
|
BuildRequires: %{python_module pytest-mock}
|
||||||
|
BuildRequires: %{python_module pytest}
|
||||||
BuildRequires: %{python_module python-crfsuite}
|
BuildRequires: %{python_module python-crfsuite}
|
||||||
BuildRequires: %{python_module regex}
|
|
||||||
BuildRequires: %{python_module requests}
|
BuildRequires: %{python_module requests}
|
||||||
BuildRequires: %{python_module scikit-learn}
|
BuildRequires: %{python_module scikit-learn}
|
||||||
BuildRequires: %{python_module scipy}
|
BuildRequires: %{python_module scipy}
|
||||||
BuildRequires: %{python_module text-unidecode}
|
BuildRequires: %{python_module text-unidecode}
|
||||||
BuildRequires: %{python_module tqdm}
|
|
||||||
BuildRequires: %{python_module twython}
|
BuildRequires: %{python_module twython}
|
||||||
#
|
# /SECTION
|
||||||
Requires: python-regex
|
Requires: python-regex >= 2021.8.3
|
||||||
|
Requires: python-click
|
||||||
|
Requires: python-joblib
|
||||||
|
Requires: python-tqdm
|
||||||
Recommends: python-gensim
|
Recommends: python-gensim
|
||||||
Recommends: python-matplotlib
|
Recommends: python-matplotlib
|
||||||
Recommends: python-numpy
|
Recommends: python-numpy
|
||||||
@ -75,7 +106,7 @@ Recommends: python-scikit-learn
|
|||||||
Recommends: python-scipy
|
Recommends: python-scipy
|
||||||
Recommends: python-twython
|
Recommends: python-twython
|
||||||
Requires(post): update-alternatives
|
Requires(post): update-alternatives
|
||||||
Requires(postun):update-alternatives
|
Requires(postun): update-alternatives
|
||||||
BuildArch: noarch
|
BuildArch: noarch
|
||||||
%python_subpackages
|
%python_subpackages
|
||||||
|
|
||||||
@ -87,10 +118,7 @@ Python modules, data sets and tutorials supporting research and
|
|||||||
development in Natural Language Processing.
|
development in Natural Language Processing.
|
||||||
|
|
||||||
%prep
|
%prep
|
||||||
%autosetup -p1 -a1 -n %{pyname}-%{version}
|
%autosetup -p1 -a1 -n nltk-%{version}
|
||||||
|
|
||||||
# Remove obsolete scripts
|
|
||||||
rm tools/nltk_term_index.py tools/run_doctests.py nltk_data/corpora/semcor/semcor.py
|
|
||||||
|
|
||||||
# Fix EOL
|
# Fix EOL
|
||||||
sed -i 's/\r/\n/g; s/\n$//' \
|
sed -i 's/\r/\n/g; s/\n$//' \
|
||||||
@ -120,14 +148,13 @@ sed -E -i "s|#![[:space:]]*%{_bindir}/env python|#!%{_bindir}/python3|" \
|
|||||||
setup.py \
|
setup.py \
|
||||||
tools/global_replace.py \
|
tools/global_replace.py \
|
||||||
nltk_data/corpora/pl196x/splitter.py \
|
nltk_data/corpora/pl196x/splitter.py \
|
||||||
tools/find_deprecated.py \
|
tools/find_deprecated.py
|
||||||
tools/svnmime.py
|
|
||||||
|
|
||||||
%build
|
%build
|
||||||
%python_build
|
%pyproject_wheel
|
||||||
|
|
||||||
%install
|
%install
|
||||||
%python_install
|
%pyproject_install
|
||||||
%python_clone -a %{buildroot}%{_bindir}/nltk
|
%python_clone -a %{buildroot}%{_bindir}/nltk
|
||||||
|
|
||||||
%{python_expand %fdupes %{buildroot}%{$python_sitelib}/
|
%{python_expand %fdupes %{buildroot}%{$python_sitelib}/
|
||||||
@ -148,8 +175,8 @@ export NLTK_DATA=$(readlink -f ./nltk_data/)
|
|||||||
%files %{python_files}
|
%files %{python_files}
|
||||||
%doc README.md
|
%doc README.md
|
||||||
%license LICENSE.txt
|
%license LICENSE.txt
|
||||||
%{python_sitelib}/%{pyname}/
|
%{python_sitelib}/nltk/
|
||||||
%{python_sitelib}/%{pyname}-%{version}-py%{python_version}.egg-info/
|
%{python_sitelib}/nltk-%{version}.dist-info/
|
||||||
%python_alternative %{_bindir}/nltk
|
%python_alternative %{_bindir}/nltk
|
||||||
|
|
||||||
%changelog
|
%changelog
|
||||||
|
Loading…
Reference in New Issue
Block a user