1
0

Accepting request 862684 from devel:languages:python

- Add no-cloudscraper.patch to avoid need to use cloudscraper
- Update to 3.28.0:
  - **Disable adapter_fanfictionnet with warning about site
    blocking.**
  - Catch exception from emails not decoding, skip
    & logger.error().
  - Add a fake get_image_size() method for when no image
    processing available. Closes #621 (CLI only)
  - Change adapter_twilightednet to https
  - Change for adapter_fanfictionnet to make
    skip_author_cover work again.
  - Make included certifi and requests use same tmp file code and
    store under calibre tmp dir for cleanup.
  - Add append_datepublished_to_storyurl option for
    storiesonline.net, finestories.com, scifistories.com only.

OBS-URL: https://build.opensuse.org/request/show/862684
OBS-URL: https://build.opensuse.org/package/show/openSUSE:Factory/python-fanficfare?expand=0&rev=28
This commit is contained in:
Dominique Leuenberger 2021-01-13 17:23:13 +00:00 committed by Git OBS Bridge
commit 13e29fd864
5 changed files with 247 additions and 6 deletions

BIN
FanFicFare-3.27.0.tar.gz (Stored with Git LFS)

Binary file not shown.

BIN
FanFicFare-3.28.0.tar.gz (Stored with Git LFS) Normal file

Binary file not shown.

216
no-cloudscraper.patch Normal file
View File

@@ -0,0 +1,216 @@
--- a/fanficfare/configurable.py
+++ b/fanficfare/configurable.py
@@ -44,7 +44,6 @@ import pickle
## isn't found in plugin when only imported down below inside
## get_scraper()
-import cloudscraper
from . import exceptions
@@ -210,7 +209,6 @@ def get_valid_set_options():
'titlepage_use_table':(None,None,boollist),
'use_ssl_unverified_context':(None,None,boollist),
- 'use_cloudscraper':(None,None,boollist),
'continue_on_chapter_error':(None,None,boollist),
'conditionals_use_lists':(None,None,boollist),
'dedup_chapter_list':(None,None,boollist),
@@ -483,7 +481,6 @@ def get_valid_keywords():
'tweak_fg_sleep',
'universe_as_series',
'use_ssl_unverified_context',
- 'use_cloudscraper',
'user_agent',
'username',
'website_encodings',
@@ -598,16 +595,11 @@ class Configuration(ConfigParser):
self.override_sleep = None
self.cookiejar = self.get_empty_cookiejar()
self.opener = build_opener(HTTPCookieProcessor(self.cookiejar),GZipProcessor())
- self.scraper = None
self.pagecache = self.get_empty_pagecache()
self.save_cache_file = None
self.save_cookiejar_file = None
- def __del__(self):
- if self.scraper is not None:
- self.scraper.close()
-
def section_url_names(self,domain,section_url_f):
## domain is passed as a method to limit the damage if/when an
## adapter screws up _section_url
@@ -1073,24 +1065,6 @@ class Configuration(ConfigParser):
logger.warning("reduce_zalgo failed(%s), continuing."%e)
return data
- def get_scraper(self):
- if not self.scraper:
- ## ffnet adapter can't parse mobile output, so we only
- ## want desktop browser. But cloudscraper then insists on
- ## a browser and platform, too.
- self.scraper = cloudscraper.CloudScraper(browser={
- 'browser': 'chrome',
- 'platform': 'windows',
- 'mobile': False,
- 'desktop': True,
- })
- ## CloudScraper is subclass of requests.Session.
- ## probably need import higher up if ever used.
- # import requests
- # self.scraper = requests.Session()
- self.scraper.cookies = self.cookiejar
- return self.scraper
-
# Assumes application/x-www-form-urlencoded. parameters, headers are dict()s
def _postUrl(self, url,
parameters={},
@@ -1132,24 +1106,15 @@ class Configuration(ConfigParser):
# headers['Authorization']=b"Basic %s" % base64string
# logger.debug("http login for SB xf2test")
- if self.getConfig('use_cloudscraper',False):
- logger.debug("Using cloudscraper for POST")
- resp = self.get_scraper().post(url,
- headers=dict(headers),
- data=parameters)
- logger.debug("response code:%s"%resp.status_code)
- resp.raise_for_status() # raises HTTPError if error code.
- data = resp.content
- else:
- req = Request(url,
- data=ensure_binary(urlencode(parameters)),
- headers=headers)
-
- ## Specific UA because too many sites are blocking the default python UA.
- self.opener.addheaders = [('User-Agent', self.getConfig('user_agent')),
- ('X-Clacks-Overhead','GNU Terry Pratchett')]
+ req = Request(url,
+ data=ensure_binary(urlencode(parameters)),
+ headers=headers)
+
+ ## Specific UA because too many sites are blocking the default python UA.
+ self.opener.addheaders = [('User-Agent', self.getConfig('user_agent')),
+ ('X-Clacks-Overhead','GNU Terry Pratchett')]
- data = self.opener.open(req,None,float(self.getConfig('connect_timeout',30.0))).read()
+ data = self.opener.open(req,None,float(self.getConfig('connect_timeout',30.0))).read()
data = self._do_reduce_zalgo(self._decode(data))
self._progressbar()
## postURL saves data to the pagecache *after* _decode() while
@@ -1227,37 +1192,16 @@ class Configuration(ConfigParser):
self.opener.addheaders = headers
- if self.getConfig('use_cloudscraper',False):
- ## requests / cloudscraper wants a dict() for headers, not
- ## list of tuples.
- headers = dict(headers)
- ## let cloudscraper do its thing with UA.
- if 'User-Agent' in headers:
- del headers['User-Agent']
- if parameters != None:
- logger.debug("Using cloudscraper for fetch POST")
- resp = self.get_scraper().post(url,
- headers=headers,
- data=parameters)
- else:
- logger.debug("Using cloudscraper for GET")
- resp = self.get_scraper().get(url,
- headers=headers)
- logger.debug("response code:%s"%resp.status_code)
- resp.raise_for_status() # raises HTTPError if error code.
- data = resp.content
- opened = FakeOpened(data,resp.url)
+ ## opener.open() will to POST with params(data) and GET without.
+ if parameters != None:
+ opened = self.opener.open(url,
+ ensure_binary(urlencode(parameters)),
+ float(self.getConfig('connect_timeout',30.0)))
else:
- ## opener.open() will to POST with params(data) and GET without.
- if parameters != None:
- opened = self.opener.open(url,
- ensure_binary(urlencode(parameters)),
- float(self.getConfig('connect_timeout',30.0)))
- else:
- opened = self.opener.open(url,
- None,
- float(self.getConfig('connect_timeout',30.0)))
- data = opened.read()
+ opened = self.opener.open(url,
+ None,
+ float(self.getConfig('connect_timeout',30.0)))
+ data = opened.read()
self._progressbar()
## postURL saves data to the pagecache *after* _decode() while
## fetchRaw saves it *before* _decode()--because raw.
--- a/fanficfare/defaults.ini
+++ b/fanficfare/defaults.ini
@@ -2793,15 +2793,6 @@ type_label:Type of Couple
website_encodings:Windows-1252,utf8
[www.fanfiction.net]
-## Using cloudscraper can satisfy the first couple levels of
-## Cloudflare bot-proofing, but not all levels. Older versions of
-## OpenSSL will also raise problems, so versions of Calibre older than
-## v5 will probably fail. Only fanfiction.net and fictionpress.com
-## are configured with use_cloudscraper:true by default, but it can be
-## applied in other sites' ini sections. user_agent setting is
-## ignored when use_cloudscraper:true
-use_cloudscraper:true
-
## fanfiction.net's 'cover' images are really just tiny thumbnails.
## Set this to true to never use them.
#never_make_cover: false
@@ -2888,15 +2879,6 @@ website_encodings:Windows-1252,utf8
slow_down_sleep_time:10
[www.fictionpress.com]
-## Using cloudscraper can satisfy the first couple levels of
-## Cloudflare bot-proofing, but not all levels. Older versions of
-## OpenSSL will also raise problems, so versions of Calibre older than
-## v5 will probably fail. Only fanfiction.net and fictionpress.com
-## are configured with use_cloudscraper:true by default, but it can be
-## applied in other sites' ini sections. user_agent setting is
-## ignored when use_cloudscraper:true
-use_cloudscraper:true
-
## Clear FanFiction from defaults, fictionpress.com is original fiction.
extratags:
--- a/makeplugin.py
+++ b/makeplugin.py
@@ -23,7 +23,7 @@ from makezip import createZipFile
if __name__=="__main__":
filename="FanFicFare.zip"
exclude=['*.pyc','*~','*.xcf','*[0-9].png','*.po','*.pot','*default.mo','*Thumbs.db']
-
+
os.chdir('calibre-plugin')
files=['plugin-defaults.ini','plugin-example.ini','about.html',
'images','translations']
@@ -35,8 +35,8 @@ if __name__=="__main__":
exclude=exclude)
os.chdir('../included_dependencies')
- files=['bs4','chardet','html2text','soupsieve','backports',
- 'cloudscraper','requests','requests_toolbelt','urllib3',
+ files=['bs4', 'chardet', 'html2text', 'soupsieve', 'backports',
+ 'requests', 'requests_toolbelt', 'urllib3',
'certifi','idna']
## Kept only for v2.85.1 support now.
createZipFile("../"+filename,"a",
--- a/setup.py
+++ b/setup.py
@@ -84,8 +84,7 @@ setup(
install_requires=['beautifulsoup4',
'chardet',
'html5lib',
- 'html2text',
- 'cloudscraper'],
+ 'html2text'],
# html5lib requires 'six', FFF includes it's own copy as fanficfare.six
# List additional groups of dependencies here (e.g. development

View File

@@ -1,3 +1,26 @@
-------------------------------------------------------------------
Tue Jan 12 16:12:03 UTC 2021 - Matej Cepl <mcepl@suse.com>
- Add no-cloudscraper.patch to avoid need to use cloudscraper
-------------------------------------------------------------------
Mon Jan 11 17:28:41 CET 2021 - Matej Cepl <mcepl@suse.com>
- Update to 3.28.0:
- **Disable adapter_fanfictionnet with warning about site
blocking.**
- Catch exception from emails not decoding, skip
& logger.error().
- Add a fake get_image_size() method for when no image
processing available. Closes #621 (CLI only)
- Change adapter_twilightednet to https
  - Change for adapter_fanfictionnet to make
    skip_author_cover work again.
- Make included certifi and requests use same tmp file code and
store under calibre tmp dir for cleanup.
- Add append_datepublished_to_storyurl option for
storiesonline.net, finestories.com, scifistories.com only.
------------------------------------------------------------------- -------------------------------------------------------------------
Thu Dec 24 16:17:00 UTC 2020 - Matej Cepl <mcepl@suse.com> Thu Dec 24 16:17:00 UTC 2020 - Matej Cepl <mcepl@suse.com>

View File

@@ -1,7 +1,7 @@
# #
# spec file for package python-fanficfare # spec file for package python-fanficfare
# #
# Copyright (c) 2020 SUSE LLC # Copyright (c) 2021 SUSE LLC
# #
# All modifications and additions to the file contributed by third parties # All modifications and additions to the file contributed by third parties
# remain the property of their copyright owners, unless otherwise agreed # remain the property of their copyright owners, unless otherwise agreed
@@ -21,7 +21,7 @@
%define skip_python2 1 %define skip_python2 1
%{?!python_module:%define python_module() python-%{**} python3-%{**}} %{?!python_module:%define python_module() python-%{**} python3-%{**}}
Name: python-fanficfare Name: python-fanficfare
Version: 3.27.0 Version: 3.28.0
Release: 0 Release: 0
Summary: Tool for making eBooks from stories on fanfiction and other web sites Summary: Tool for making eBooks from stories on fanfiction and other web sites
License: GPL-3.0-only License: GPL-3.0-only
@@ -29,6 +29,9 @@ Group: Development/Languages/Python
URL: https://github.com/JimmXinu/FanFicFare URL: https://github.com/JimmXinu/FanFicFare
Source: https://github.com/JimmXinu/%{modname}/archive/v%{version}/%{modname}-%{version}.tar.gz Source: https://github.com/JimmXinu/%{modname}/archive/v%{version}/%{modname}-%{version}.tar.gz
# Source: %%{modname}-%%{version}.tar.gz # Source: %%{modname}-%%{version}.tar.gz
# PATCH-FEATURE-OPENSUSE no-cloudscraper.patch mcepl@suse.com
# don't use cloudscraper
Patch0: no-cloudscraper.patch
BuildRequires: %{python_module beautifulsoup4} BuildRequires: %{python_module beautifulsoup4}
BuildRequires: %{python_module chardet} BuildRequires: %{python_module chardet}
BuildRequires: %{python_module html2text} BuildRequires: %{python_module html2text}
@@ -39,7 +42,6 @@ BuildRequires: fdupes
BuildRequires: python-rpm-macros BuildRequires: python-rpm-macros
Requires: python-beautifulsoup4 Requires: python-beautifulsoup4
Requires: python-chardet Requires: python-chardet
Requires: python-cloudscraper
Requires: python-html2text Requires: python-html2text
Requires: python-html5lib Requires: python-html5lib
Requires: python-setuptools Requires: python-setuptools