Installation guide¶

Supported Python versions¶

Scrapy requires Python 3.6+, either the CPython implementation (default) or the PyPy 7.2.0+ implementation (see Alternate Implementations).

Installing Scrapy¶

If you’re using Anaconda or Miniconda, you can install the package from the conda-forge channel, which has up-to-date packages for Linux, Windows and macOS.

To install Scrapy using conda, run:
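    conda install -c conda-forge scrapy

This is the standard conda-forge invocation; it pulls Scrapy and its non-Python dependencies from the conda-forge channel.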
Using a virtual environment (recommended)¶

TL;DR: We recommend installing Scrapy inside a virtual environment on all platforms.

Python packages can be installed either globally (a.k.a. system wide) or in user-space. We do not recommend installing Scrapy system wide.

Instead, we recommend that you install Scrapy within a so-called “virtual environment” (venv). Virtual environments let you avoid conflicts with already-installed Python system packages (which could break some of your system tools and scripts), while still installing packages normally with pip (without sudo and the like).

See Virtual Environments and Packages on how to create your virtual environment.

Once you have created a virtual environment, you can install Scrapy inside it with pip, just like any other Python package. (See the platform-specific guides below for non-Python dependencies that you may need to install beforehand.) A minimal command sequence is sketched below.
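A minimal sketch, assuming python3 and pip are available on your PATH; the environment name scrapy-env is arbitrary:

    python3 -m venv scrapy-env
    source scrapy-env/bin/activate   # on Windows: scrapy-env\Scripts\activate
    pip install scrapy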
There’s a lesson here: for most scraping code, you want it to be resilient to errors due to things not being found on a page, so that even if some parts fail to be scraped, you can at least get some data.

Besides the getall() and get() methods, you can also use the re() method to extract using regular expressions:

    >>> response.css('title::text').re(r'Quotes.*')
    ['Quotes to Scrape']
    >>> response.css('title::text').re(r'Q\w+')
    ['Quotes']
    >>> response.css('title::text').re(r'(\w+) to (\w+)')
    ['Quotes', 'Scrape']
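Relatedly, get() returns None when nothing matches and also accepts a default value, which is what makes the “fail soft” behaviour described above possible. A short sketch (the CSS selector is hypothetical):

    >>> response.css('p.does-not-exist::text').get() is None
    True
    >>> response.css('p.does-not-exist::text').get(default='not-found')
    'not-found'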
CloseSpider extension (issue 4836)

Removed references to Python 2’s unicode type (issue 4547, issue 4703)

We now have an official deprecation policy (issue 4705)

Our documentation policies now cover usage of Sphinx’s versionadded and versionchanged directives, and we have removed usages referencing Scrapy 1.4.0 and earlier versions (issue 3971, issue 4310)

Other documentation cleanups (issue 4090, issue 4782, issue 4800, issue 4801, issue 4809, issue 4816, issue 4825)
Quality assurance¶

Extended typing hints (issue 4243, issue 4691)

Added tests for the check command (issue 4663)

Fixed test failures on Debian (issue 4726, issue 4727, issue 4735)

Improved Windows test coverage (issue 4723)

Switched to formatted string literals where possible (issue 4307, issue 4324, issue 4672)

Modernized super() usage (issue 4707)

Other code and test cleanups (issue 1790, issue 3288, issue 4165, issue 4564, issue 4651, issue 4714, issue 4738, issue 4745, issue 4747, issue 4761, issue 4765, issue 4804, issue 4817, issue 4820, issue 4822, issue 4839)

CookiesMiddleware fixes
Backward-incompatible changes¶

Support for Python 3.5.0 and 3.5.1 has been dropped; Scrapy now refuses to run with a Python version lower than 3.5.2, which introduced typing.Type (issue 4615)
Deprecations¶

TextResponse.body_as_unicode is now deprecated, use TextResponse.text instead

… not downloaded; see FilesPipeline.get_media_requests for more information (issue 2893, issue 4486)

When using Google Cloud Storage for a media pipeline, a warning is now logged if the configured credentials do not grant the required permissions (issue 4346, issue 4508)

Link extractors are now serializable, as long as you do not use lambdas for parameters; for example, you can now pass link extractors in Request.cb_kwargs or Request.meta when persisting scheduled requests (issue 4554)

Upgraded the pickle protocol that Scrapy uses from protocol 2 to protocol 4, improving serialization capabilities and performance (issue 4135, issue 4541)

scrapy.utils.misc.create_instance() now raises a TypeError exception if the resulting instance is None (issue 4528, issue 4532)
Bug fixes¶

CookiesMiddleware no longer discards cookies defined in Request.headers (issue 1992, issue 2400)

CookiesMiddleware no longer re-encodes cookies defined as bytes in the cookies parameter of the __init__ method of Request (issue 2400, issue 3575)

When FEEDS defines multiple URIs, FEED_STORE_EMPTY is False and the crawl yields no items, Scrapy no longer stops feed exports after the first URI (issue 4621, issue 4626)

Spider callbacks defined using coroutine syntax no longer need to return an iterable, and may instead return a Request object, an item, or None (issue 4609)

The startproject command now ensures that the generated project folders and files have the right permissions (issue 4604)

Fixed a KeyError exception that was sometimes raised from scrapy.utils.datatypes.LocalWeakReferencedCache (issue 4597, issue 4599)

When FEEDS defines multiple URIs, log messages about items being stored now contain information from the corresponding feed, instead of always containing information about only one of the feeds (issue 4619, issue 4629)
Documentation¶

Added a new section about accessing cb_kwargs from errbacks (issue 4598, issue 4634)

Covered chompjs in Parsing JavaScript code (issue 4556, issue 4562)

Removed from Coroutines the warning about the API being experimental (issue 4511, issue 4513)

Removed references to unsupported versions of Twisted (issue 4533)

Updated the description of the screenshot pipeline example, which now uses coroutine syntax instead of returning a Deferred (issue 4514, issue 4593)

Removed a misleading import line from the scrapy.utils.log.configure_logging() code example (issue 4510, issue 4587)

The display-on-hover behavior of internal documentation references now also covers links to commands, Request.meta keys, settings and … (…, issue 4572)

Removed remnants of Python 2 support (issue 4550, issue 4553, issue 4568)

Improved code sharing between the crawl and runspider commands (issue 4548, issue 4552)

Replaced chain(*iterable) with chain.from_iterable(iterable) (issue 4635)

You may now run the asyncio tests with Tox on any Python version (issue 4521)

Updated test requirements to reflect an incompatibility with pytest 5.4 and 5.4.1 (issue 4588)

Improved SpiderLoader test coverage for scenarios involving duplicate spider names (issue 4549, issue 4560)

Configured Travis CI to also run the tests with Python 3.5.2 (issue 4518, issue 4615)
New FEEDS setting to export to multiple feeds

New Response.ip_address attribute

AssertionError exceptions triggered by assert statements have been replaced by new exception types, to support running Python in optimized mode (see -O) without changing Scrapy’s behavior in any unexpected ways.

If you catch an AssertionError exception from Scrapy, update your code to catch the corresponding new exception.

Request serialization no longer breaks for callbacks that are spider attributes which are assigned a function with a different name (issue 4500)

None values in allowed_domains no longer cause a TypeError exception (issue 4410)

Zsh completion no longer allows options after arguments (issue 4438)

zope.interface 5.0.0 and later versions are now supported (issue 4447, issue 4448)

Spider.make_requests_from_url, deprecated in Scrapy 1.4.0, now issues a warning when used (issue 4412)

Removed warnings about using old, removed settings (issue 4404)

Removed a warning about importing StringTransport from twisted.test.proto_helpers in Twisted 19.7.0 or newer (issue 4409)

Removed outdated Debian package build files (issue 4384)

Removed object usage as a base class (issue 4430)

Removed code that added support for old versions of Twisted that we no longer support (issue 4472)

Fixed code style issues (issue 4468, issue 4469, issue 4471, issue 4481)

Removed twisted.internet.defer.returnValue() calls (issue 4443, issue 4446, issue 4489)

Python 2 support has been removed

Partial coroutine syntax support and experimental asyncio support

New Response.follow_all method

FTP support for media pipelines

New Response.certificate attribute

IPv6 support through DNS_RESOLVER

scrapy.linkextractors.FilteringLinkExtractor is deprecated, use scrapy.linkextractors.LinkExtractor instead (issue 4045)

The noconnect query string argument of proxy URLs is deprecated and should be removed from proxy URLs (issue 4198)

The next method of scrapy.utils.python.MutableChain is deprecated, use the global next() function or MutableChain.__next__ instead (issue 4153)

Added partial support for Python’s coroutine syntax and experimental support for asyncio and asyncio-powered libraries (issue 4010, issue 4259, issue 4269, issue 4270, issue 4271, issue 4316, issue 4318)

The new Response.follow_all method offers the same functionality as Response.follow but supports an iterable of URLs as input and returns an iterable of requests (issue 2582, issue 4057, issue 4286)

item_error for exceptions raised during item processing by item pipelines

spider_error for exceptions raised from spider callbacks

The FEED_URI setting now supports pathlib.Path values (issue 3731, issue 4074)

A new request_left_downloader signal is sent when a request leaves the downloader (issue 4303)

Scrapy logs a warning when it detects a request callback or errback that uses yield but also returns a value, since the returned value would be lost (issue 3484, issue 3869)

Spider objects now raise an AttributeError exception if they do not have a start_urls attribute nor reimplement start_requests, but have a start_url attribute (issue 4133, issue 4170)

BaseItemExporter subclasses may now use super().__init__(**kwargs) instead of self._configure(kwargs) in their __init__ method, passing dont_fail=True to the parent __init__ method if needed, and accessing kwargs at self._kwargs …

RFPDupeFilter, the default DUPEFILTER_CLASS, no longer writes an extra \r character on each line in Windows, which made the size of the requests.seen file unnecessarily large on that platform (issue 4283)

Z shell auto-completion now looks for .html files, not .http files, and covers the -h command-line switch (issue 4122, issue 4291)

Adding items to a scrapy.utils.datatypes.LocalCache object without a limit defined no longer raises a TypeError exception (issue 4123)

Fixed a typo in the message of the ValueError exception raised when scrapy.utils.misc.create_instance() gets both settings and crawler set to None (issue 4128)

Cross-references within our documentation now display a tooltip when hovered (issue 4173, issue 4183)

Improved the documentation about LinkExtractor.extract_links and simplified Link Extractors (issue 4045)

Clarified how ItemLoader.item works (issue 3574, issue 4099)

Clarified that logging.basicConfig() should not be used when also using CrawlerProcess (issue 2149, issue 2352, issue 3146, issue 3960)

Clarified the requirements for Request objects when using persistence (issue 4124, issue 4139)

Clarified how to install a custom image pipeline (issue 4034, issue 4252)

Fixed the signatures of the file_path method in media pipeline examples (issue 4290)

Fixed logic issues, broken links and typos (issue 4247, issue 4258, issue 4282, issue 4288, issue 4305, issue 4308, issue 4323, issue 4338, issue 4359, issue 4361)

Improved consistency when referring to the __init__ method of an object (issue 4086, issue 4088)

Fixed an inconsistency between code and output in Scrapy at a glance (issue 4213)

Extended intersphinx usage (issue 4147, issue 4172, issue 4185, issue 4194, issue 4197)

We now use a recent version of Python to build the documentation (issue 4140, issue 4249)

Cleaned up documentation (issue 4143, issue 4275)

Improved test coverage (issue 4097, issue 4218, issue 4236)

Started reporting slowest tests, and improved the performance of some of them (issue 4163, issue 4164)

Fixed broken tests and refactored some tests (issue 4014, issue 4095, issue 4244, issue 4268, issue 4372)

Modified the tox configuration to allow running tests with any Python version, run Bandit and Flake8 tests by default, and enforce a minimum tox version programmatically (issue 4179)

Cleaned up code (issue 3937, issue 4208, issue 4209, issue 4210, issue 4212, issue 4369, issue 4376, issue 4378)

ItemLoader.load_item() no longer makes later calls to ItemLoader.get_output_value() or ItemLoader.load_item() return empty data (issue 3804, issue 3819, issue 3897, issue 3976, issue 3998, issue 4036)

Fixed DummyStatsCollector raising a TypeError exception (issue 4007, issue 4052)

FilesPipeline.file_path and ImagesPipeline.file_path no longer choose file extensions that are not registered with IANA (issue 1287, issue 3953, issue 3954)

When using botocore to persist files in S3, all botocore-supported headers are properly mapped now (issue 3904, issue 3905)

FTP passwords in FEED_URI containing percent-escaped characters …

The following modules are deprecated:

scrapy.utils.http (use w3lib.http)

scrapy.utils.markup (use w3lib.html)

scrapy.utils.multipart (use urllib3)

The scrapy.utils.datatypes.MergeDict class is deprecated for Python 3 code bases. Use ChainMap instead. (issue 3878)

The scrapy.utils.gz.is_gzipped function is deprecated. Use scrapy.utils.gz.gzip_magic_number instead.

CrawlerProcess.start(stop_after_crawl=True)[source]¶

This method starts a reactor, adjusts its pool size to REACTOR_THREADPOOL_MAXSIZE, and installs a DNS cache based on DNSCACHE_ENABLED and DNSCACHE_SIZE.

If stop_after_crawl is True, the reactor will be stopped after all crawlers have finished, using join().
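A sketch of running a crawl through CrawlerProcess as described above (the spider, settings values and URL are illustrative):

    import scrapy
    from scrapy.crawler import CrawlerProcess

    class QuotesSpider(scrapy.Spider):
        name = 'quotes'
        start_urls = ['https://quotes.toscrape.com']

        def parse(self, response):
            yield {'title': response.css('title::text').get()}

    process = CrawlerProcess(settings={'REACTOR_THREADPOOL_MAXSIZE': 20})
    process.crawl(QuotesSpider)
    # Starts the Twisted reactor; returns once all crawlers have finished
    process.start(stop_after_crawl=True)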
get(name, default=None)[source]¶

Get a setting value without affecting its original type.

getbool(name, default=False)[source]¶

1, '1', True and 'True' return True, while 0, '0', False, 'False' and None return False.

For example, settings populated through environment variables set to '0' will return False when using this method.

getdict(name, default=None)[source]¶

If value is a BaseSettings instance itself, it will be converted to a dictionary, containing all its current settings values as they would be returned by get(), and losing all information about priority and mutability.

getlist(name, default=None)[source]¶

Get a setting value as a list. If the setting original type is a list, a copy of it will be returned. If it’s a string it will be split by “,”.

For example, settings populated through environment variables set to 'one,two' will return a list ['one', 'two'] when using this method.

getpriority(name)[source]¶

Return the current numerical priority value of a setting, or None if the given name does not exist.

getwithbase(name)[source]¶

Get a composition of a dictionary-like setting and its _BASE counterpart.

maxpriority()[source]¶

set(name, value, priority='project')[source]¶

Store a key/value attribute with a given priority.

Settings should be populated before configuring the Crawler object (through the configure() method), otherwise they won’t have any effect.

Parameters

name (str) – the setting name

value (object) – the value to associate with the setting

priority (str or int) – the priority of the setting. Should be a key of SETTINGS_PRIORITIES or an integer

setmodule(module, priority='project')[source]¶

Store settings from a module with a given priority.

This is a helper function that calls set() for every globally declared uppercase variable of module with the provided priority.

Parameters

module (types.ModuleType or str) – the module or the path of the module

priority (str or int) – the priority of the settings. Should be a key of SETTINGS_PRIORITIES or an integer

update(values, priority='project')[source]¶

Parameters

values (dict or string or BaseSettings) – the settings names and values

priority (str or int) – the priority of the settings. Should be a key of SETTINGS_PRIORITIES or an integer
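A short sketch of how these methods interact (setting names are real Scrapy settings; the values and priorities are illustrative):

    >>> from scrapy.settings import Settings
    >>> settings = Settings({'RETRY_ENABLED': '0', 'DOWNLOAD_DELAY': 'one,two'})
    >>> settings.getbool('RETRY_ENABLED')        # '0' is read as False
    False
    >>> settings.set('DOWNLOAD_DELAY', 2, priority='cmdline')
    >>> settings.update({'DOWNLOAD_DELAY': 5}, priority='spider')  # lower priority: ignored
    >>> settings.getint('DOWNLOAD_DELAY')
    2
    >>> settings.getpriority('DOWNLOAD_DELAY')   # 'cmdline' maps to 40 in SETTINGS_PRIORITIES
    40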
load(spider_name)[source]¶

Get the Spider class with the given name. It’ll look into the previously loaded spiders for a spider class with name spider_name and will raise a KeyError if not found.

list()[source]¶

connect(receiver, signal, **kwargs)[source]¶

Connect a receiver function to a signal.

The signal can be any object, although Scrapy comes with some predefined signals that are documented in the Signals section.

Parameters

receiver (collections.abc.Callable) – the function to be connected

signal (object) – the signal to connect to

disconnect_all(signal, **kwargs)[source]¶

Disconnect all receivers from the given signal.

send_catch_log(signal, **kwargs)[source]¶
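A sketch of using connect() from a spider’s from_crawler, which is the usual place to register signal handlers (the handler body and log message are illustrative):

    from scrapy import signals, Spider

    class MySpider(Spider):
        name = 'example'

        @classmethod
        def from_crawler(cls, crawler, *args, **kwargs):
            spider = super().from_crawler(crawler, *args, **kwargs)
            # Register spider_closed() as a receiver for the spider_closed signal
            crawler.signals.connect(spider.spider_closed, signal=signals.spider_closed)
            return spider

        def spider_closed(self, spider):
            self.logger.info('Spider closed: %s', spider.name)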
class scrapy.contracts.Contract(method, *args)[source]¶

Parameters

method (collections.abc.Callable) – callback function to which the contract is associated

args (list) – list of arguments passed into the docstring (whitespace separated)

… Request callbacks.

    adapter = ItemAdapter(item)
    adapter['field'] = await db.get_some_data(adapter['id'])
    return item

Common uses for coroutines include:

requesting data from websites, databases and other services (in callbacks, pipelines and middlewares);

storing data in databases (in pipelines and middlewares);

scrapy.utils.curl.curl_to_request_kwargs(curl_command, ignore_unknown_options=True)[source]¶

Convert a cURL command syntax to Request kwargs.

Parameters

curl_command (str) – string containing the curl command

ignore_unknown_options (bool) – If true, only a warning is emitted when cURL options are unknown. Otherwise raises an error. (default: True)

Returns

dictionary of Request kwargs
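A sketch of calling this helper (the command string is illustrative; the exact keys in the returned dictionary depend on which cURL options are present):

    >>> from scrapy import Request
    >>> from scrapy.utils.curl import curl_to_request_kwargs
    >>> kwargs = curl_to_request_kwargs("curl 'https://example.org' -H 'Accept: text/html'")
    >>> kwargs['url']
    'https://example.org'
    >>> request = Request(**kwargs)  # the returned kwargs can be fed directly to Request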
class scrapy.extensions.httpcache.DbmCacheStorage[source]¶

A DBM storage backend is also available for the HTTP cache middleware.

By default, it uses the dbm module, but you can change it with the HTTPCACHE_DBM_MODULE setting.

class scrapy.downloadermiddlewares.httpproxy.HttpProxyMiddleware[source]¶

This middleware sets the HTTP proxy to use for requests, by setting the proxy meta value for Request objects.

Like the Python standard library module urllib.request, it obeys the following environment variables:

http_proxy

https_proxy

no_proxy

You can also set the meta key proxy per-request, to a proxy URL value.

Protego (the default parser):

supports wildcard matching

uses the length based rule

Scrapy uses this parser by default.

RobotFileParser:

is Python’s built-in robots.txt parser

is compliant with Martijn Koster’s 1996 draft specification

lacks support for wildcard matching

doesn’t use the length based rule

abstract allowed(url, user_agent)[source]¶

Return True if user_agent is allowed to crawl url, otherwise return False.

abstract classmethod from_crawler(crawler, robotstxt_body)[source]¶

Parse the content of a robots.txt file as bytes. This must be a class method. It must return a new instance of the parser backend.

Parameters

crawler (Crawler instance) – crawler which made the request

robotstxt_body (bytes) – content of a robots.txt file.
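A minimal sketch of a custom parser backend implementing these two abstract methods (deliberately permissive; the class name is illustrative and not part of Scrapy). Such a backend would be selected through the ROBOTSTXT_PARSER setting:

    from scrapy.robotstxt import RobotParser

    class AllowAllRobotParser(RobotParser):
        """Toy backend that parses nothing and allows every URL."""

        def __init__(self, robotstxt_body):
            self.body = robotstxt_body  # bytes, kept only for reference

        @classmethod
        def from_crawler(cls, crawler, robotstxt_body):
            # Must return a new instance of the parser backend
            return cls(robotstxt_body)

        def allowed(self, url, user_agent):
            # Return True if user_agent may crawl url
            return True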
If the response is HTML or XML, use selectors as usual.

If the response is JSON, use json.loads() to load the desired data from response.text:

    data = json.loads(response.text)

If the desired data is inside HTML or XML code embedded within JSON data, you can load that HTML or XML code into a Selector and then use it as usual:

    selector = Selector(data['html'])

If the response is JavaScript, or HTML with a <script/> element containing the desired data, see Parsing JavaScript code.

If the response is CSS, use a regular expression to extract the desired data from response.text.

If the response is an image or another format based on images (e.g. PDF), read the response as bytes from response.body and use an OCR solution to extract the desired data.

If the JavaScript code is within a <script/> element of an HTML page, use selectors to extract the text within that <script/> element.

You might be able to use a regular expression to extract the desired data in JSON format, which you can then parse with json.loads().

For example, if the JavaScript code contains a separate line like var data = {"field": "value"}; you can extract that data as follows:

    >>> pattern = r'\bvar\s+data\s*=\s*(\{.*?\})\s*;\s*\n'
    >>> json_data = response.css('script::text').re_first(pattern)
    >>> json.loads(json_data)
    {'field': 'value'}

chompjs provides an API to parse JavaScript objects into a dict.

For example, if the JavaScript code contains var data = {field: "value", secondField: "second value"}; you can extract that data as follows:

    >>> import chompjs
    >>> javascript = response.css('script::text').get()
    >>> data = chompjs.parse_js_object(javascript)
    >>> data
Sending e-mail¶

Although Python makes sending e-mails relatively easy via the smtplib library, Scrapy provides its own facility for sending e-mails which is very easy to use and is implemented using Twisted non-blocking IO, to avoid interfering with the non-blocking IO of the crawler. It also provides a simple API for sending attachments and is very easy to configure, with a few settings.

Quick example¶

There are two ways to instantiate the mail sender. You can instantiate it using the standard __init__ method:

    from scrapy.mail import MailSender
    mailer = MailSender()

    mailer.send(to=["someone@example.com"], subject="Some subject", body="Some body", cc=["another@example.com"])

MailSender class reference¶

MailSender is the preferred class to use for sending emails from Scrapy, as it uses Twisted non-blocking IO, like the rest of the framework.

class scrapy.mail.MailSender(smtphost=None, mailfrom=None, smtpuser=None, smtppass=None, smtpport=None)[source]¶

Parameters

smtphost (str or bytes) – the SMTP host to use for sending the emails. If omitted, the MAIL_HOST setting will be used.

mailfrom (str) – the address used to send emails (in the From: header). If omitted, the MAIL_FROM setting will be used.

smtpuser – the SMTP user. If omitted, the MAIL_USER setting will be used. If not given, no SMTP authentication will be performed.

smtpport (int) – the SMTP port to connect to

smtptls (bool) – enforce using SMTP STARTTLS

smtpssl (bool) – enforce using a secure SSL connection

classmethod from_settings(settings)[source]¶

Instantiate using a Scrapy settings object, which will respect …

send(to, subject, body, cc=None, attachs=(), mimetype='text/plain', charset=None)[source]¶

Send email to the given recipients.

Parameters

to (str or list) – the e-mail recipients as a string or as a list of strings

subject (str) – the subject of the e-mail

cc (str or list) – the e-mails to CC as a string or as a list of strings

body (str) – the e-mail body

attachs (collections.abc.Iterable) – an iterable of tuples (attach_name, mimetype, file_object) where attach_name is a string with the name that will appear on the e-mail’s attachment, mimetype is the mimetype of the attachment and file_object is a readable file object with the contents of the attachment

mimetype (str) – the MIME type of the e-mail

charset (str) – the character encoding to use for the e-mail contents
exception scrapy.exceptions.CloseSpider(reason='cancelled')[source]¶

This exception can be raised from a spider callback to request the spider to be closed/stopped. Supported arguments:

For example:

    def parse_page(self, response):
        if 'Bandwidth exceeded' in response.body:
            raise CloseSpider('bandwidth_exceeded')

… received in the signal handler that raises the exception. Also, the response object is marked with "download_stopped" in its Response.flags attribute.

Note

fail is a keyword-only parameter, i.e. raising StopDownload(False) or StopDownload(True) will raise a TypeError.

See the documentation for the bytes_received signal and the Stopping the download of a Response topic for additional information and examples.
│ │ │-
│ │ │
- Parameters │ │ │
-
│ │ │ -
field (
Field
object or adict
instance) – the field being serialized. If the source item object does not define field metadata, field is an empty │ │ │ -dict
.
│ │ │ -name (str) – the name of the field being serialized
│ │ │ +field (
Field
object or adict
instance) – the field being serialized. If the source item object does not define field metadata, field is an empty │ │ │ +dict
.
│ │ │ +name (str) – the name of the field being serialized
│ │ │ value – the value being serialized
│ │ │
│ │ │
-
│ │ │ @@ -453,31 +453,31 @@
│ │ │
-
│ │ │ class
scrapy.exporters.
PythonItemExporter
(*, dont_fail=False, **kwargs)[source]¶
│ │ │ This is a base class for item exporters that extends │ │ │
│ │ │BaseItemExporter
with support for nested items.It serializes items to built-in Python types, so that any serialization │ │ │ -library (e.g.
│ │ │ +library (e.g.json
or msgpack) can be used on top of it.json
or msgpack) can be used on top of it. │ │ │
PythonItemExporter¶
│ │ │-
│ │ │
│ │ ││ │ ├── ./usr/share/doc/python-scrapy-doc/html/topics/extensions.html │ │ │ @@ -554,15 +554,15 @@ │ │ │XmlItemExporter¶
│ │ │-
│ │ │
-
│ │ │ class
scrapy.exporters.
XmlItemExporter
(file, item_element='item', root_element='items', **kwargs)[source]¶
│ │ │ Exports items in XML format to the specified file object.
│ │ │-
│ │ │
- Parameters │ │ │
-
│ │ │
file – the file-like object to use for exporting the data. Its
write
method should │ │ │ acceptbytes
(a disk file opened in binary mode, aio.BytesIO
object, etc)
│ │ │ -root_element (str) – The name of root element in the exported XML.
│ │ │ -item_element (str) – The name of each item element in the exported XML.
│ │ │ +root_element (str) – The name of root element in the exported XML.
│ │ │ +item_element (str) – The name of each item element in the exported XML.
│ │ │
│ │ │
The additional keyword arguments of this
│ │ │__init__
method are passed to the │ │ │BaseItemExporter
__init__
method.A typical output of this exporter would be:
│ │ ││ │ ││ │ │<?xml version="1.0" encoding="utf-8"?> │ │ │ @@ -526,28 +526,28 @@ │ │ │ CSV columns and their order. The
export_empty_fields
attribute has │ │ │ no effect on this exporter. │ │ │-
│ │ │
- Parameters │ │ │
-
│ │ │
file – the file-like object to use for exporting the data. Its
write
method should │ │ │ acceptbytes
(a disk file opened in binary mode, aio.BytesIO
object, etc)
│ │ │ -include_headers_line (str) – If enabled, makes the exporter output a header │ │ │ +
include_headers_line (str) – If enabled, makes the exporter output a header │ │ │ line with the field names taken from │ │ │
BaseItemExporter.fields_to_export
or the first exported item fields.
│ │ │ join_multivalued – The char (or chars) that will be used for joining │ │ │ multi-valued fields, if found.
│ │ │ -errors (str) – The optional string that specifies how encoding and decoding │ │ │ +
errors (str) – The optional string that specifies how encoding and decoding │ │ │ errors are to be handled. For more information see │ │ │ -
io.TextIOWrapper
.
│ │ │ +
io.TextIOWrapper
. │ │ │
│ │ │
The additional keyword arguments of this
│ │ │__init__
method are passed to the │ │ │BaseItemExporter
__init__
method, and the leftover arguments to the │ │ │ -csv.writer()
function, so you can use anycsv.writer()
function │ │ │ +csv.writer()
function, so you can use anycsv.writer()
function │ │ │ argument to customize this exporter.A typical output of this exporter would be:
│ │ ││ │ │ @@ -561,19 +561,19 @@ │ │ │ class│ │ │product,price │ │ │ Color TV,1200 │ │ │ DVD player,200 │ │ │
scrapy.exporters.
PickleItemExporter
(file, protocol=0, **kwargs)[source]¶ │ │ │ │ │ │ │ │ │Exports items in pickle format to the given file-like object.
│ │ │-
│ │ │
- Parameters │ │ │
- │ │ │ │ │ │
For more information, see
│ │ │ +pickle
.For more information, see
│ │ │pickle
.The additional keyword arguments of this
│ │ │__init__
method are passed to the │ │ │BaseItemExporter
__init__
method.Pickle isn’t a human readable format, so no output examples are provided.
│ │ ││ │ │ @@ -603,16 +603,16 @@ │ │ ││ │ │JsonItemExporter¶
│ │ │-
│ │ │
-
│ │ │ class
scrapy.exporters.
JsonItemExporter
(file, **kwargs)[source]¶
│ │ │ Exports items in JSON format to the specified file-like object, writing all │ │ │ objects as a list of objects. The additional
│ │ │ +arguments to the__init__
method arguments are │ │ │ passed to theBaseItemExporter
__init__
method, and the leftover │ │ │ -arguments to theJSONEncoder
__init__
method, so you can use any │ │ │ -JSONEncoder
__init__
method argument to customize this exporter.JSONEncoder
__init__
method, so you can use any │ │ │ +JSONEncoder
__init__
method argument to customize this exporter. │ │ │-
│ │ │
- Parameters │ │ │
file – the file-like object to use for exporting the data. Its
│ │ │write
method should │ │ │ acceptbytes
(a disk file opened in binary mode, aio.BytesIO
object, etc)
│ │ │
A typical output of this exporter would be:
│ │ │ @@ -637,16 +637,16 @@ │ │ │JsonLinesItemExporter¶
│ │ │-
│ │ │
-
│ │ │ class
scrapy.exporters.
JsonLinesItemExporter
(file, **kwargs)[source]¶
│ │ │ Exports items in JSON format to the specified file-like object, writing one │ │ │ JSON-encoded item per line. The additional
│ │ │ +the__init__
method arguments are passed │ │ │ to theBaseItemExporter
__init__
method, and the leftover arguments to │ │ │ -theJSONEncoder
__init__
method, so you can use any │ │ │ -JSONEncoder
__init__
method argument to customize this exporter.JSONEncoder
__init__
method, so you can use any │ │ │ +JSONEncoder
__init__
method argument to customize this exporter. │ │ │-
│ │ │
- Parameters │ │ │
file – the file-like object to use for exporting the data. Its
│ │ │write
method should │ │ │ acceptbytes
(a disk file opened in binary mode, aio.BytesIO
object, etc)
│ │ │
A typical output of this exporter would be:
│ │ │ @@ -661,20 +661,20 @@ │ │ │
│ │ ││ │ │MarshalItemExporter¶
│ │ │-
│ │ │
-
│ │ │ class
scrapy.exporters.
MarshalItemExporter
(file, **kwargs)[source]¶
│ │ │ Exports items in a Python-specific binary format (see │ │ │ -
│ │ │ +marshal
).marshal
). │ │ │-
│ │ │
- Parameters │ │ │
file – The file-like object to use for exporting the data. Its │ │ │ -
│ │ │ +write
method should acceptbytes
(a disk file │ │ │ -opened in binary mode, aBytesIO
object, etc)write
method should acceptbytes
(a disk file │ │ │ +opened in binary mode, aBytesIO
object, etc) │ │ │
│ │ │
│ │ ││ │ │Debugger extension¶
│ │ │ │ │ │ │ │ │ -Invokes a Python debugger inside a running Scrapy process when a SIGUSR2 │ │ │ +
Invokes a Python debugger inside a running Scrapy process when a SIGUSR2 │ │ │ signal is received. After the debugger is exited, the Scrapy process continues │ │ │ running normally.
│ │ │For more info see Debugging in Python.
│ │ │This extension only works on POSIX-compliant platforms (i.e. not Windows).
│ │ ││ │ │FEEDS¶
│ │ ││ │ ││ │ │New in version 2.1.
│ │ │Default:
│ │ │ -{}
A dictionary in which every key is a feed URI (or a
pathlib.Path
│ │ │ +A dictionary in which every key is a feed URI (or a
│ │ │pathlib.Path
│ │ │ object) and each value is a nested dictionary containing configuration │ │ │ parameters for the specific feed.This setting is required for enabling the feed export feature.
│ │ │See Storage backends for supported URI schemes.
│ │ │For instance:
│ │ │{ │ │ │ 'items.json': { │ │ │ @@ -563,15 +563,15 @@ │ │ │
│ │ ││ │ │ │ │ │New in version 2.3.0.
│ │ │ │ │ │encoding
: falls back toFEED_EXPORT_ENCODING
. │ │ │fields
: falls back toFEED_EXPORT_FIELDS
. │ │ │ -indent
: falls back toFEED_EXPORT_INDENT
.
│ │ │ +item_export_kwargs
:dict
with keyword arguments for the corresponding item exporter class. │ │ │
│ │ │item_export_kwargs
:dict
with keyword arguments for the corresponding item exporter class.│ │ ││ │ │New in version 2.4.0.
│ │ │
│ │ │overwrite
: whether to overwrite the file if it already exists │ │ │ (True
) or append to its content (False
).The default value depends on the storage backend:
│ │ │ @@ -715,15 +715,15 @@ │ │ │When generating multiple output files, you must use at least one of the following │ │ │ placeholders in the feed URI to indicate how the different output file names are │ │ │ generated:
│ │ │-
│ │ │
%(batch_time)s
- gets replaced by a timestamp when the feed is being created │ │ │ (e.g.2020-03-28T14-45-08.237134
)
│ │ │
│ │ │ -%(batch_id)d
- gets replaced by the 1-based sequence number of the batch.Use printf-style string formatting to │ │ │ +
Use printf-style string formatting to │ │ │ alter the number format. For example, to make the batch ID a 5-digit │ │ │ number by introducing leading zeroes as needed, use
│ │ │%(batch_id)05d
│ │ │ (e.g.3
becomes00003
,123
becomes00123
).
│ │ │
For instance, if your settings include:
│ │ ││ │ │FEED_EXPORT_BATCH_ITEM_COUNT = 100 │ │ │ @@ -744,26 +744,26 @@ │ │ │
Where the first and second files contain exactly 100 items. The last one contains │ │ │ 100 items or fewer.
│ │ ││ │ │FEED_URI_PARAMS¶
│ │ │Default:
│ │ │None
A string with the import path of a function to set the parameters to apply with │ │ │ -printf-style string formatting to the │ │ │ +printf-style string formatting to the │ │ │ feed URI.
│ │ │The function signature should be as follows:
│ │ │-
│ │ │
-
│ │ │
scrapy.extensions.feedexport.
uri_params
(params, spider)¶
│ │ │ - Return a
│ │ │ +dict
of key-value pairs to apply to the feed URI using │ │ │ -printf-style string formatting.Return a
│ │ │dict
of key-value pairs to apply to the feed URI using │ │ │ +printf-style string formatting.-
│ │ │
- Parameters │ │ │
-
│ │ │ -
params (dict) –
default key-value pairs
│ │ │ +params (dict) –
default key-value pairs
│ │ │Specifically:
│ │ │-
│ │ │
│ │ │batch_id
: ID of the file batch. See │ │ │FEED_EXPORT_BATCH_ITEM_COUNT
.If
│ │ │FEED_EXPORT_BATCH_ITEM_COUNT
is0
,batch_id
│ │ │ is always1
.│ │ ├── ./usr/share/doc/python-scrapy-doc/html/topics/items.html │ │ │ @@ -252,28 +252,28 @@ │ │ ││ │ ││ │ │Item Types¶
│ │ │Scrapy supports the following types of items, via the itemadapter library: │ │ │ dictionaries, Item objects, │ │ │ dataclass objects, and attrs objects.
│ │ ││ │ ││ │ │Dictionaries¶
│ │ │ -As an item type,
│ │ │ +dict
is convenient and familiar.As an item type,
│ │ │dict
is convenient and familiar.│ │ ││ │ │Item objects¶
│ │ │ -Item
provides adict
-like API plus additional features that │ │ │ +
│ │ │Item
provides adict
-like API plus additional features that │ │ │ make it the most feature-complete item type:-
│ │ │
-
│ │ │ class
scrapy.item.
Item
([arg])[source]¶
│ │ │ - Item
objects replicate the standarddict
API, including │ │ │ +
│ │ │Item
objects replicate the standarddict
API, including │ │ │ its__init__
method.
│ │ │Item
allows defining field names, so that:-
│ │ │ -
KeyError
is raised when using undefined field names (i.e. │ │ │ +KeyError
is raised when using undefined field names (i.e. │ │ │ prevents typos going unnoticed)
│ │ │ Item exporters can export all fields by │ │ │ default even if the first scraped object does not have values for all │ │ │ of them
│ │ │
│ │ │ @@ -284,15 +284,15 @@ │ │ │Item
also allows defining field metadata, which can be used to │ │ │ customize serialization.-
│ │ │
copy
()¶
│ │ │
-
│ │ │
-
│ │ │
deepcopy
()¶
│ │ │ - Return a
│ │ │ +deepcopy()
of this item.Return a
│ │ │deepcopy()
of this item.
-
│ │ │
-
│ │ │
fields
¶
│ │ │ A dictionary containing all declared fields for this Item, not only │ │ │ those populated. The keys are the field names and the values are the │ │ │ @@ -311,21 +311,21 @@ │ │ │
│ │ ││ │ ├── ./usr/share/doc/python-scrapy-doc/html/topics/leaks.html │ │ │ @@ -382,15 +382,15 @@ │ │ │ │ │ │Dataclass objects¶
│ │ ││ │ ││ │ │ -New in version 2.2.
│ │ │dataclass()
allows defining item classes with field names, │ │ │ +
│ │ │dataclass()
allows defining item classes with field names, │ │ │ so that item exporters can export all fields by │ │ │ default even if the first scraped object does not have values for all of them.Additionally,
│ │ │dataclass
items also allow to:-
│ │ │
define the type and default value of each defined field.
│ │ │ -define custom field metadata through
dataclasses.field()
, which can be used to │ │ │ +define custom field metadata through
dataclasses.field()
, which can be used to │ │ │ customize serialization.
│ │ │
They work natively in Python 3.7 or later, or using the dataclasses │ │ │ backport in Python 3.6.
│ │ │Example:
│ │ ││ │ ││ │ │from dataclasses import dataclass │ │ │ │ │ │ @@ -341,24 +341,24 @@ │ │ │
│ │ ││ │ │ │ │ │attr.s objects¶
│ │ ││ │ ││ │ │ -New in version 2.2.
│ │ │attr.s()
allows defining item classes with field names, │ │ │ +
│ │ │attr.s()
allows defining item classes with field names, │ │ │ so that item exporters can export all fields by │ │ │ default even if the first scraped object does not have values for all of them.Additionally,
│ │ │attr.s
items also allow to:-
│ │ │
define the type and default value of each defined field.
│ │ │ -define custom field metadata, which can be used to │ │ │ +
define custom field metadata, which can be used to │ │ │ customize serialization.
│ │ │
In order to use this type, the attrs package needs to be installed.
│ │ │ +In order to use this type, the attrs package needs to be installed.
│ │ │Example:
│ │ ││ │ ││ │ │import attr │ │ │ │ │ │ @attr.s │ │ │ class CustomItem: │ │ │ one_field = attr.ib() │ │ │ another_field = attr.ib() │ │ │ @@ -406,15 +406,15 @@ │ │ │ documentation to see which metadata keys are used by each component. │ │ │
It’s important to note that the
│ │ │Field
objects used to declare the item │ │ │ do not stay assigned as class attributes. Instead, they can be accessed through │ │ │ theItem.fields
attribute.-
│ │ │
-
│ │ │ class
scrapy.item.
Field
([arg])[source]¶
│ │ │ - The
Field
class is just an alias to the built-indict
class and │ │ │ +The
│ │ │Field
class is just an alias to the built-indict
class and │ │ │ doesn’t provide any extra functionality or attributes. In other words, │ │ │Field
objects are plain-old Python dicts. A separate class is used │ │ │ to support the item declaration syntax │ │ │ based on class attributes.
│ │ │ @@ -424,15 +424,15 @@ │ │ │ attr.ib for additional information. │ │ ││ │ ││ │ ││ │ │Working with Item objects¶
│ │ │Here are some examples of common tasks performed with items, using the │ │ │
│ │ │ +notice the API is very similar to theProduct
item declared above. You will │ │ │ -notice the API is very similar to thedict
API.dict
API. │ │ ││ │ ││ │ │Creating items¶
│ │ ││ │ │ @@ -498,37 +498,37 @@ │ │ │ ... │ │ │ KeyError: 'Product does not support field: lala' │ │ ││ │ │>>> product = Product(name='Desktop PC', price=1000) │ │ │ >>> print(product) │ │ │ Product(name='Desktop PC', price=1000) │ │ │
│ │ ││ │ │Accessing all populated values¶
│ │ │ -To access all populated values, just use the typical
│ │ │ +dict
API:To access all populated values, just use the typical
│ │ │dict
API:│ │ ││ │ │>>> product.keys() │ │ │ ['price', 'name'] │ │ │
│ │ ││ │ │>>> product.items() │ │ │ [('price', 1000), ('name', 'Desktop PC')] │ │ │
│ │ ││ │ │ @@ -583,15 +583,15 @@ │ │ │ classCopying items¶
│ │ │To copy an item, you must first decide whether you want a shallow copy or a │ │ │ deep copy.
│ │ │ -If your item contains mutable values like lists or dictionaries, │ │ │ +
If your item contains mutable values like lists or dictionaries, │ │ │ a shallow copy will keep references to the same mutable values across all │ │ │ different copies.
│ │ │For example, if you have an item with a list of tags, and you create a shallow │ │ │ copy of that item, both the original item and the copy have the same list of │ │ │ tags. Adding a tag to the list of one of the items will add the tag to the │ │ │ other item as well.
│ │ │If that is not the desired behavior, use a deep copy instead.
│ │ │ -See
│ │ │ +copy
for more information.See
│ │ │copy
for more information.To create a shallow copy of an item, you can either call │ │ │
│ │ │copy()
on an existing item │ │ │ (product2 = product.copy()
) or instantiate your item class from an existing │ │ │ item (product2 = Product(product)
).To create a deep copy, call
│ │ │deepcopy()
instead │ │ │ (product2 = product.deepcopy()
).itemadapter.
ItemAdapter
(item: Any)[source]¶ │ │ │ │ │ │ │ │ │ │ │ │ │ │ │Wrapper class to interact with data container objects. It provides a common interface │ │ │ to extract and set data without having to take the object’s type into account.
│ │ ││ │ ││ │ │Request serialization¶
│ │ │For persistence to work,
│ │ │Request
objects must be │ │ │ -serializable withpickle
, except for thecallback
anderrback
│ │ │ +serializable withpickle
, except for thecallback
anderrback
│ │ │ values passed to their__init__
method, which must be methods of the │ │ │ runningSpider
class.If you wish to log the requests that couldn’t be serialized, you can set the │ │ │
│ │ │SCHEDULER_DEBUG
setting toTrue
in the project’s settings page. │ │ │ It isFalse
by default.-
│ │ │
-
│ │ │
scrapy.utils.trackref.
print_live_refs
(class_name, ignore=NoneType)[source]¶
│ │ │ Print a report of live references, grouped by class name.
│ │ │ │ │ │
-
│ │ │
-
│ │ ├── ./usr/share/doc/python-scrapy-doc/html/topics/link-extractors.html
class scrapy.linkextractors.lxmlhtml.LxmlLinkExtractor(allow=(), deny=(), allow_domains=(), deny_domains=(), deny_extensions=None, restrict_xpaths=(), restrict_css=(), tags=('a', 'area'), attrs=('href',), canonicalize=False, unique=True, process_value=None, strip=True)[source]¶

LxmlLinkExtractor is the recommended link extractor with handy filtering options. It is implemented using lxml’s robust HTMLParser.

Parameters

allow (str or list) – a single regular expression (or list of regular expressions) that the (absolute) urls must match in order to be extracted. If not given (or empty), it will match all links.

deny (str or list) – a single regular expression (or list of regular expressions) that the (absolute) urls must match in order to be excluded (i.e. not extracted). It has precedence over the allow parameter. If not given (or empty) it won’t exclude any links.

allow_domains (str or list) – a single value or a list of strings containing domains which will be considered for extracting the links

deny_domains (str or list) – a single value or a list of strings containing domains which won’t be considered for extracting the links

deny_extensions (list) – a single value or list of strings containing extensions that should be ignored when extracting links. If not given, it will default to scrapy.linkextractors.IGNORED_EXTENSIONS.

Changed in version 2.0: IGNORED_EXTENSIONS now includes 7z, 7zip, apk, bz2, cdr, dmg, ico, iso, tar, tar.gz, webm, and xz.

restrict_xpaths (str or list) – an XPath (or list of XPaths) which defines regions inside the response where links should be extracted from. If given, only the text selected by those XPaths will be scanned for links. See examples below.

restrict_css (str or list) – a CSS selector (or list of selectors) which defines regions inside the response where links should be extracted from. Has the same behaviour as restrict_xpaths.

restrict_text (str or list) – a single regular expression (or list of regular expressions) that the link’s text must match in order to be extracted. If not given (or empty), it will match all links. If a list of regular expressions is given, the link will be extracted if it matches at least one.

tags (str or list) – a tag or a list of tags to consider when extracting links. Defaults to ('a', 'area').

attrs (list) – an attribute or list of attributes which should be considered when looking for links to extract (only for those tags specified in the tags parameter). Defaults to ('href',)

canonicalize (bool) – canonicalize each extracted url (using w3lib.url.canonicalize_url). Defaults to False. Note that canonicalize_url is meant for duplicate checking; it can change the URL visible at server side, so the response can be different for requests with canonicalized and raw URLs. If you’re using LinkExtractor to follow links it is more robust to keep the default canonicalize=False.

unique (bool) – whether duplicate filtering should be applied to extracted links.

process_value (collections.abc.Callable) – a function which receives each value extracted from the tag and attributes scanned and can modify the value and return a new one, or return None to ignore the link altogether. If not given, process_value defaults to lambda x: x.

For example, to extract links from this code:

    <a href="javascript:goToPage('../other/page.html'); return false">Link text</a>

    def process_value(value):
        m = re.search("javascript:goToPage\('(.*?)'", value)
        if m:
            return m.group(1)

strip (bool) – whether to strip whitespaces from extracted attributes. According to the HTML5 standard, leading and trailing whitespaces must be stripped from href attributes of <a>, <area> and many other elements, the src attribute of <img>, <iframe> elements, etc., so LinkExtractor strips space chars by default. Set strip=False to turn it off (e.g. if you’re extracting urls from elements or attributes which allow leading/trailing whitespaces).
│ │ │By default, dataclass items require all fields to be │ │ │ passed when created. This could be an issue when using dataclass items with │ │ │ item loaders: unless a pre-populated item is passed to the loader, fields │ │ │ will be populated incrementally using the loader’s
│ │ │add_xpath()
, │ │ │add_css()
andadd_value()
methods.One approach to overcome this is to define items using the │ │ │ -
│ │ │ +field()
function, with adefault
argument:field()
function, with adefault
argument: │ │ │from dataclasses import dataclass, field │ │ │ from typing import Optional │ │ │ │ │ │ @dataclass │ │ │ class InventoryItem: │ │ │ name: Optional[str] = field(default=None) │ │ │ price: Optional[float] = field(default=None) │ │ │ @@ -581,15 +581,15 @@ │ │ │
add_css
(field_name, css, *processors, **kw)[source]¶ │ │ │Similar to
│ │ │ItemLoader.add_value()
but receives a CSS selector │ │ │ instead of a value, which is used to extract a list of unicode strings │ │ │ from the selector associated with thisItemLoader
.See
│ │ │get_css()
forkwargs
.-
│ │ │
- Parameters │ │ │ -
css (str) – the CSS selector to extract data from
│ │ │ + │ │ │css (str) – the CSS selector to extract data from
│ │ │
Examples:
│ │ ││ │ │# HTML snippet: <p class="product-name">Color TV</p> │ │ │ loader.add_css('name', 'p.product-name') │ │ │ # HTML snippet: <p id="price">the price is $1200</p> │ │ │ loader.add_css('price', 'p#price', re='the price is (.*)') │ │ │ @@ -624,15 +624,15 @@ │ │ │
add_xpath(field_name, xpath, *processors, **kw)[source]¶
Similar to ItemLoader.add_value() but receives an XPath instead of a value, which is used to extract a list of strings from the selector associated with this ItemLoader.
See get_xpath() for kwargs.
Parameters
    xpath (str) – the XPath to extract data from
Examples:

# HTML snippet: <p class="product-name">Color TV</p>
loader.add_xpath('name', '//p[@class="product-name"]')
# HTML snippet: <p id="price">the price is $1200</p>
loader.add_xpath('price', '//p[@id="price"]', re='the price is (.*)')
get_css(css, *processors, **kw)[source]¶
Similar to ItemLoader.get_value() but receives a CSS selector instead of a value, which is used to extract a list of unicode strings from the selector associated with this ItemLoader.
Parameters
    css (str) – the CSS selector to extract data from
    re (str or typing.Pattern) – a regular expression to use for extracting data from the selected CSS region
Examples:

# HTML snippet: <p class="product-name">Color TV</p>
loader.get_css('p.product-name')

get_value(value, *processors, **kw)[source]¶
Process the given value by the given processors and keyword arguments.
Available keyword arguments:
Parameters
    re (str or typing.Pattern) – a regular expression to use for extracting data from the given value using the extract_regex() method, applied before processors
Examples:

>>> from itemloaders import ItemLoader
>>> from itemloaders.processors import TakeFirst

get_xpath(xpath, *processors, **kw)[source]¶
Similar to ItemLoader.get_value() but receives an XPath instead of a value, which is used to extract a list of unicode strings from the selector associated with this ItemLoader.
Parameters
    xpath (str) – the XPath to extract data from
    re (str or typing.Pattern) – a regular expression to use for extracting data from the selected XPath region
Examples:

# HTML snippet: <p class="product-name">Color TV</p>
loader.get_xpath('//p[@class="product-name"]')
Logging¶

Note
scrapy.log has been deprecated alongside its functions in favor of explicit calls to the Python standard logging. Keep reading to learn more about the new logging system.

Scrapy uses logging for event logging. We'll provide some simple examples to get you started, but for more advanced use-cases it's strongly suggested to read thoroughly its documentation.
Logging works out of the box, and can be configured to some extent with the Scrapy settings listed in Logging settings.
Scrapy calls scrapy.utils.log.configure_logging() to set some reasonable defaults and handle those settings in Logging settings when running commands, so it's recommended to manually call it if you're running Scrapy from scripts. For example, to emit a message through a module-level logger:

logger = logging.getLogger(__name__)
logger.warning("This is a warning")
│ │ │Scrapy provides a
│ │ │logger
within each Spider │ │ │ @@ -370,16 +370,16 @@ │ │ │ messages will be displayed on the standard error. Lastly, if │ │ │LOG_ENABLED
isFalse
, there won’t be any visible log output.
│ │ │LOG_LEVEL
determines the minimum level of severity to display, those │ │ │ messages with lower severity will be filtered out. It ranges through the │ │ │ possible levels listed in Log levels.
│ │ │LOG_FORMAT
andLOG_DATEFORMAT
specify formatting strings │ │ │ used as layouts for all messages. Those strings can contain any placeholders │ │ │ -listed in logging’s logrecord attributes docs and │ │ │ -datetime’s strftime and strptime directives │ │ │ +listed in logging’s logrecord attributes docs and │ │ │ +datetime’s strftime and strptime directives │ │ │ respectively.If
│ │ │LOG_SHORT_NAMES
is set, then the logs will not display the Scrapy │ │ │ component that prints the log. It is unset by default, hence logs contain the │ │ │ Scrapy component responsible for that log output.│ │ ││ │ │Command-line options¶
│ │ │ @@ -401,15 +401,15 @@ │ │ │ │ │ │ │ │ │ │ │ │ │ │ ││ │ ││ │ │See also
│ │ │-
│ │ │ -
- Module
logging.handlers
Further documentation on available handlers
│ │ │ +- Module
logging.handlers
Further documentation on available handlers
│ │ │
│ │ │
│ │ ││ │ │Custom Log Formats¶
│ │ │A custom log format can be set for different actions by extending │ │ │ @@ -543,15 +543,15 @@ │ │ │
scrapy.utils.log.
configure_logging
(settings=None, install_root_handler=True)[source]¶ │ │ │Initialize logging defaults for Scrapy.
│ │ │-
│ │ │
- Parameters │ │ │
-
│ │ │
settings (dict,
Settings
object orNone
) – settings used to create and configure a handler for the │ │ │ root logger (default: None).
│ │ │ -install_root_handler (bool) – whether to install root logging handler │ │ │ +
install_root_handler (bool) – whether to install root logging handler │ │ │ (default: True)
│ │ │
│ │ │
This function does:
│ │ │-
│ │ │
Route warnings and twisted logging through Python standard logging
│ │ │ @@ -564,17 +564,17 @@
│ │ │ using
settings
argument. Whensettings
is empty or None, defaults │ │ │ are used. │ │ │
│ │ │configure_logging
is automatically called when using Scrapy commands │ │ │ orCrawlerProcess
, but needs to be called explicitly │ │ │ when running custom scripts usingCrawlerRunner
. │ │ │ In that case, its usage is not required but it’s recommended.Another option when running custom scripts is to manually configure the logging. │ │ │ -To do this you can use
│ │ │ +To do this you can uselogging.basicConfig()
to set a basic root handler.logging.basicConfig()
to set a basic root handler. │ │ │Note that
│ │ │CrawlerProcess
automatically callsconfigure_logging
, │ │ │ -so it is recommended to only uselogging.basicConfig()
together with │ │ │ +so it is recommended to only uselogging.basicConfig()
together with │ │ │CrawlerRunner
.This is an example on how to redirect
│ │ │INFO
or higher messages to a file:│ │ │ │ │ ││ │ │import logging │ │ │ │ │ │ logging.basicConfig( │ │ │ filename='log.txt', │ │ │ format='%(levelname)s: %(message)s', │ │ ├── ./usr/share/doc/python-scrapy-doc/html/topics/practices.html │ │ │ @@ -300,15 +300,15 @@ │ │ │ d = runner.crawl(MySpider) │ │ │ d.addBoth(lambda _: reactor.stop()) │ │ │ reactor.run() # the script will block here until the crawling is finished │ │ │
│ │ ││ │ │ │ │ │ -Running multiple spiders in the same process¶
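The lines just above are the tail of a run-from-a-script example. A fuller sketch of that pattern, combining configure_logging() with CrawlerRunner (the spider class and URL are placeholders for this sketch):

from twisted.internet import reactor
import scrapy
from scrapy.crawler import CrawlerRunner
from scrapy.utils.log import configure_logging

class MySpider(scrapy.Spider):
    name = 'myspider'
    start_urls = ['http://example.com/']

    def parse(self, response):
        yield {'title': response.css('title::text').get()}

configure_logging({'LOG_FORMAT': '%(levelname)s: %(message)s'})
runner = CrawlerRunner()
d = runner.crawl(MySpider)
d.addBoth(lambda _: reactor.stop())
reactor.run()  # the script will block here until the crawling is finished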
│ │ │By default, Scrapy runs a single spider per process when you run
│ │ ├── ./usr/share/doc/python-scrapy-doc/html/topics/request-response.html │ │ │ @@ -269,45 +269,45 @@ │ │ │ classscrapy │ │ │ crawl
. However, Scrapy supports running multiple spiders per process using │ │ │ the internal API.scrapy.http.
Request
(*args, **kwargs)[source]¶ │ │ │A
│ │ │Request
object represents an HTTP request, which is usually │ │ │ generated in the Spider and executed by the Downloader, and thus generating │ │ │ aResponse
.-
│ │ │
- Parameters │ │ │
-
│ │ │ -
url (str) –
the URL of this request
│ │ │ -If the URL is invalid, a
│ │ │ +ValueError
exception is raised.url (str) –
the URL of this request
│ │ │ +If the URL is invalid, a
│ │ │ValueError
exception is raised.
│ │ │ -callback (collections.abc.Callable) – the function that will be called with the response of this │ │ │ +
callback (collections.abc.Callable) – the function that will be called with the response of this │ │ │ request (once it’s downloaded) as its first parameter. For more information │ │ │ see Passing additional data to callback functions below. │ │ │ If a Request doesn’t specify a callback, the spider’s │ │ │
parse()
method will be used. │ │ │ Note that if exceptions are raised during processing, errback is called instead.
│ │ │ -method (str) – the HTTP method of this request. Defaults to
'GET'
.
│ │ │ -meta (dict) – the initial values for the
Request.meta
attribute. If │ │ │ +method (str) – the HTTP method of this request. Defaults to
'GET'
.
│ │ │ +meta (dict) – the initial values for the
Request.meta
attribute. If │ │ │ given, the dict passed in this parameter will be shallow copied.
│ │ │ -body (bytes or str) – the request body. If a string is passed, then it’s encoded as │ │ │ +
body (bytes or str) – the request body. If a string is passed, then it’s encoded as │ │ │ bytes using the
encoding
passed (which defaults toutf-8
). If │ │ │body
is not given, an empty bytes object is stored. Regardless of the │ │ │ type of this argument, the final value stored will be a bytes object │ │ │ (never a string orNone
).
│ │ │ -headers (dict) –
the headers of this request. The dict values can be strings │ │ │ +
headers (dict) –
the headers of this request. The dict values can be strings │ │ │ (for single valued headers) or lists (for multi-valued headers). If │ │ │
│ │ │None
is passed as value, the HTTP header will not be sent at all.│ │ │
│ │ ││ │ ││ │ │Caution
│ │ │Cookies set via the
│ │ │Cookie
header are not considered by the │ │ │ CookiesMiddleware. If you need to set cookies for a request, use the │ │ │Request.cookies
parameter. This is a known │ │ │ current limitation that is being worked on.
│ │ │ -the request cookies. These can be sent in two forms.
│ │ │ +the request cookies. These can be sent in two forms.
│ │ │-
│ │ │
Using a dict:
│ │ ││ │ ││ │ │request_with_cookies = Request(url="http://www.example.com", │ │ │ cookies={'currency': 'USD', 'country': 'UY'}) │ │ │
│ │ │ @@ -344,38 +344,38 @@
│ │ │
Caution
│ │ │Cookies set via the
│ │ │Cookie
header are not considered by the │ │ │ CookiesMiddleware. If you need to set cookies for a request, use the │ │ │Request.cookies
parameter. This is a known │ │ │ current limitation that is being worked on.
encoding (str) – the encoding of this request (defaults to
'utf-8'
). │ │ │ + │ │ │ -encoding (str) – the encoding of this request (defaults to
'utf-8'
). │ │ │ This encoding will be used to percent-encode the URL and to convert the │ │ │ body to bytes (if given as a string).priority (int) – the priority of this request (defaults to
0
). │ │ │ + │ │ │ -priority (int) – the priority of this request (defaults to
0
). │ │ │ The priority is used by the scheduler to define the order used to process │ │ │ requests. Requests with a higher priority value will execute earlier. │ │ │ Negative values are allowed in order to indicate relatively low-priority.dont_filter (bool) – indicates that this request should not be filtered by │ │ │ +
│ │ │ -dont_filter (bool) – indicates that this request should not be filtered by │ │ │ the scheduler. This is used when you want to perform an identical │ │ │ request multiple times, to ignore the duplicates filter. Use it with │ │ │ care, or you will get into crawling loops. Default to
False
.errback (collections.abc.Callable) –
a function that will be called if any exception was │ │ │ +
│ │ │ -errback (collections.abc.Callable) –
a function that will be called if any exception was │ │ │ raised while processing the request. This includes pages that failed │ │ │ with 404 HTTP errors and such. It receives a │ │ │
│ │ │Failure
as first parameter. │ │ │ For more information, │ │ │ see Using errbacks to catch exceptions in request processing below.│ │ ││ │ │Changed in version 2.0: The callback parameter is no longer required when the errback │ │ │ parameter is specified.
│ │ │ │ │ │ -flags (list) – Flags sent to the request, can be used for logging or similar purposes.
│ │ │ +cb_kwargs (dict) – A dict with arbitrary data that will be passed as keyword arguments to the Request’s callback.
│ │ │ +flags (list) – Flags sent to the request, can be used for logging or similar purposes.
│ │ │ │ │ │ │ │ │ │ │ │cb_kwargs (dict) – A dict with arbitrary data that will be passed as keyword arguments to the Request’s callback.
-
│ │ │
-
│ │ │
url
¶
│ │ │ A string containing the URL of this request. Keep in mind that this │ │ │ @@ -411,27 +411,27 @@ │ │ │
meta
¶ │ │ │A dict that contains arbitrary metadata for this request. This dict is │ │ │ empty for new Requests, and is usually populated by different Scrapy │ │ │ components (extensions, middlewares, etc). So the data contained in this │ │ │ dict depends on the extensions you have enabled.
│ │ │See Request.meta special keys for a list of special meta keys │ │ │ recognized by Scrapy.
│ │ │ -This dict is shallow copied when the request is │ │ │ +
This dict is shallow copied when the request is │ │ │ cloned using the
│ │ │copy()
orreplace()
methods, and can also be │ │ │ accessed, in your spider, from theresponse.meta
attribute.
-
│ │ │
-
│ │ │
cb_kwargs
¶
│ │ │ A dictionary that contains arbitrary metadata for this request. Its contents │ │ │ will be passed to the Request’s callback as keyword arguments. It is empty │ │ │ for new Requests, which means by default callbacks only get a
│ │ │ -Response
│ │ │ object as argument.This dict is shallow copied when the request is │ │ │ +
This dict is shallow copied when the request is │ │ │ cloned using the
│ │ │copy()
orreplace()
methods, and can also be │ │ │ accessed, in your spider, from theresponse.cb_kwargs
attribute.In case of a failure to process the request, this dict can be accessed as │ │ │
│ │ │failure.request.cb_kwargs
in the request’s errback. For more information, │ │ │ see Accessing additional data in errback functions.
- │ │ │ class
│ │ │scrapy.http.
FormRequest
(url[, formdata, ...])[source]¶The
│ │ │FormRequest
class adds a new keyword parameter to the__init__
method. The │ │ │ remaining arguments are the same as for theRequest
class and are │ │ │ not documented here.-
│ │ │
- Parameters │ │ │ -
formdata (dict or collections.abc.Iterable) – is a dictionary (or iterable of (key, value) tuples) │ │ │ +
│ │ │formdata (dict or collections.abc.Iterable) – is a dictionary (or iterable of (key, value) tuples) │ │ │ containing HTML Form data which will be url-encoded and assigned to the │ │ │ body of the request.
│ │ │
The
│ │ │FormRequest
objects support the following class method in │ │ │ addition to the standardRequest
methods:-
│ │ │ @@ -752,31 +752,31 @@
│ │ │ bug in lxml, which should be fixed in lxml 3.8 and above.
│ │ │
-
│ │ │
- Parameters │ │ │
-
│ │ │
response (
Response
object) – the response containing a HTML form which will be used │ │ │ to pre-populate the form fields
│ │ │ -formname (str) – if given, the form with name attribute set to this value will be used.
│ │ │ -formid (str) – if given, the form with id attribute set to this value will be used.
│ │ │ -formxpath (str) – if given, the first form that matches the xpath will be used.
│ │ │ -formcss (str) – if given, the first form that matches the css selector will be used.
│ │ │ -formnumber (int) – the number of form to use, when the response contains │ │ │ +
formname (str) – if given, the form with name attribute set to this value will be used.
│ │ │ +formid (str) – if given, the form with id attribute set to this value will be used.
│ │ │ +formxpath (str) – if given, the first form that matches the xpath will be used.
│ │ │ +formcss (str) – if given, the first form that matches the css selector will be used.
│ │ │ +formnumber (int) – the number of form to use, when the response contains │ │ │ multiple forms. The first one (and also the default) is
0
.
│ │ │ -formdata (dict) – fields to override in the form data. If a field was │ │ │ +
formdata (dict) – fields to override in the form data. If a field was │ │ │ already present in the response
<form>
element, its value is │ │ │ overridden by the one passed in this parameter. If a value passed in │ │ │ this parameter isNone
, the field will not be included in the │ │ │ request, even if it was present in the response<form>
element.
│ │ │ -clickdata (dict) – attributes to lookup the control clicked. If it’s not │ │ │ +
clickdata (dict) – attributes to lookup the control clicked. If it’s not │ │ │ given, the form data will be submitted simulating a click on the │ │ │ first clickable element. In addition to html attributes, the control │ │ │ can be identified by its zero-based index relative to other │ │ │ submittable inputs inside the form, via the
nr
attribute.
│ │ │ -dont_click (bool) – If True, the form data will be submitted without │ │ │ +
dont_click (bool) – If True, the form data will be submitted without │ │ │ clicking in any element.
│ │ │
│ │ │
The other parameters of this class method are passed directly to the │ │ │
│ │ │FormRequest
__init__
method.Request
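For instance, from_response() is commonly used to simulate a form login; a minimal sketch (the URL, field names and failure check are placeholders for this sketch):

import scrapy

class LoginSpider(scrapy.Spider):
    name = 'login'
    start_urls = ['http://www.example.com/users/login.php']

    def parse(self, response):
        # pre-populate the form from the response and override two fields
        return scrapy.FormRequest.from_response(
            response,
            formdata={'username': 'john', 'password': 'secret'},
            callback=self.after_login,
        )

    def after_login(self, response):
        if 'authentication failed' in response.text:
            self.logger.error('Login failed')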
class and are │ │ │ not documented here. │ │ │Using the
│ │ │JsonRequest
will set theContent-Type
header toapplication/json
│ │ │ andAccept
header toapplication/json, text/javascript, */*; q=0.01
-
│ │ │
- Parameters │ │ │
-
│ │ │ -
data (object) – is any JSON serializable object that needs to be JSON encoded and assigned to body. │ │ │ +
data (object) – is any JSON serializable object that needs to be JSON encoded and assigned to body. │ │ │ if
Request.body
argument is provided this parameter will be ignored. │ │ │ ifRequest.body
argument is not provided and data argument is providedRequest.method
will be │ │ │ set to'POST'
automatically.
│ │ │ -dumps_kwargs (dict) – Parameters that will be passed to underlying
json.dumps()
method which is used to serialize │ │ │ +dumps_kwargs (dict) – Parameters that will be passed to underlying
json.dumps()
method which is used to serialize │ │ │ data into JSON format.
│ │ │
class scrapy.http.Response(*args, **kwargs)[source]¶
A Response object represents an HTTP response, which is usually downloaded (by the Downloader) and fed to the Spiders for processing.
Parameters
    url (str) – the URL of this response
    status (int) – the HTTP status of the response. Defaults to 200.
    headers (dict) – the headers of this response. The dict values can be strings (for single valued headers) or lists (for multi-valued headers).
    body (bytes) – the response body. To access the decoded text as a string, use response.text from an encoding-aware Response subclass, such as TextResponse.
    flags (list) – is a list containing the initial values for the Response.flags attribute. If given, the list will be shallow copied.
    request (scrapy.http.Request) – the initial value of the Response.request attribute. This represents the Request that generated this response.
    certificate (twisted.internet.ssl.Certificate) – an object representing the server's SSL certificate.
    ip_address (ipaddress.IPv4Address or ipaddress.IPv6Address) – The IP address of the server from which the Response originated.
New in version 2.1.0: The ip_address parameter.

urljoin(url)[source]¶
Constructs an absolute url by combining the Response's url with a possible relative url.
This is a wrapper over urljoin(), it's merely an alias for making this call:

urllib.parse.urljoin(response.url, url)

New in version 2.0: The flags parameter.

follow_all(urls, callback=None, method='GET', headers=None, body=None, cookies=None, meta=None, encoding='utf-8', priority=0, dont_filter=False, errback=None, cb_kwargs=None, flags=None) → Generator[scrapy.http.request.Request, None, None][source]¶
New in version 2.0.
Return an iterable of Request instances to follow all links in urls. It accepts the same arguments as the Request.__init__ method, but elements of urls can be relative URLs or Link objects, not only absolute URLs.

TextResponse objects add encoding capabilities to the base Response class, which is meant to be used only for binary data, such as images, sounds or any media file.
TextResponse objects support a new __init__ method argument, in addition to the base Response objects. The remaining functionality is the same as for the Response class and is not documented here.
Parameters
    encoding (str) – is a string which contains the encoding to use for this response. If you create a TextResponse object with a string as body, it will be converted to bytes encoded using this encoding. If encoding is None (default), the encoding will be looked up in the response headers and body instead.
TextResponse objects support the following attributes in addition…

response.xpath('//img/@src')[0]

See A shortcut for creating Requests for usage examples.

follow_all(urls=None, callback=None, method='GET', headers=None, body=None, cookies=None, meta=None, encoding=None, priority=0, dont_filter=False, errback=None, cb_kwargs=None, flags=None, css=None, xpath=None) → Generator[scrapy.http.request.Request, None, None][source]¶
A generator that produces Request instances to follow all links in urls. It accepts the same arguments as the Request's __init__ method, except that each urls element does not need to be an absolute URL, it can be any of the following:
    a relative URL
    a Link object, e.g. the result of…
BeautifulSoup is a very popular web scraping library among Python programmers which constructs a Python object based on the structure of the HTML code and also deals with bad markup reasonably well, but it has one drawback: it's slow.
lxml is an XML parsing library (which also parses HTML) with a pythonic API based on ElementTree. (lxml is not part of the Python standard library.)
Scrapy comes with its own mechanism for extracting data. They're called selectors because they "select" certain parts of the HTML document specified either by XPath or CSS expressions.
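A minimal sketch of a selector in action (the HTML string is a made-up example):

from scrapy.selector import Selector

body = '<html><body><span>good</span></body></html>'
print(Selector(text=body).xpath('//span/text()').get())   # good
print(Selector(text=body).css('span::text').get())        # good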
XPath is a language for selecting nodes in XML documents, which can also be used with HTML.
For a list of available built-in settings see: Built-in settings reference.

Designating the settings¶
When you use Scrapy, you have to tell it which settings you're using. You can do this by using an environment variable, SCRAPY_SETTINGS_MODULE.
The value of SCRAPY_SETTINGS_MODULE should be in Python path syntax, e.g. myproject.settings. Note that the settings module should be on the Python import search path.

Populating the settings¶
Settings can be populated using different mechanisms, each of which having a different precedence. Here is the list of them in decreasing order of precedence:
If the asyncio reactor is enabled (see TWISTED_REACTOR) this setting can be used to specify the asyncio event loop to be used with it. Set the setting to the import path of the desired asyncio event loop class. If the setting is set to None the default asyncio event loop will be used.
If you are installing the asyncio reactor manually using the install_reactor() function, you can use the event_loop_path parameter to indicate the import path of the event loop class to be used.
Note that the event loop class must inherit from asyncio.AbstractEventLoop.

Caution
Please be aware that, when using a non-default event loop (either defined via ASYNCIO_EVENT_LOOP or installed with install_reactor()), Scrapy will call asyncio.set_event_loop(), which will set the specified event loop as the current loop for the current OS thread.
│ │ │Default:
│ │ │'scrapybot'
The name of the bot implemented by this Scrapy project (also known as the │ │ │ @@ -1020,23 +1020,23 @@ │ │ │
Default:
│ │ │None
File name to use for logging output. If
│ │ │None
, standard error will be used.│ │ ││ │ │LOG_FORMAT¶
│ │ │Default:
│ │ │'%(asctime)s [%(name)s] %(levelname)s: %(message)s'
String for formatting log messages. Refer to the │ │ │ -Python logging documentation for the qwhole │ │ │ +Python logging documentation for the qwhole │ │ │ list of available placeholders.
│ │ ││ │ ││ │ │LOG_DATEFORMAT¶
│ │ │Default:
│ │ │'%Y-%m-%d %H:%M:%S'
String for formatting date/time, expansion of the
│ │ │%(asctime)s
placeholder │ │ │ inLOG_FORMAT
. Refer to the │ │ │ -Python datetime documentation for the │ │ │ +Python datetime documentation for the │ │ │ whole list of available directives.│ │ ││ │ │ @@ -1393,18 +1393,18 @@ │ │ │ import path. Also installs the asyncio event loop with the specified import │ │ │ path if the asyncio reactor is enabled │ │ │LOG_FORMATTER¶
│ │ │Default:
│ │ │scrapy.logformatter.LogFormatter
The class to use for formatting log messages for different actions.
│ │ │
follow_all
(urls=None, callback=None, method='GET', headers=None, body=None, cookies=None, meta=None, encoding=None, priority=0, dont_filter=False, errback=None, cb_kwargs=None, flags=None, css=None, xpath=None) → Generator[scrapy.http.request.Request, None, None][source]¶ │ │ │If a reactor is already installed, │ │ │
│ │ │install_reactor()
has no effect.
│ │ │CrawlerRunner.__init__
raises │ │ │ -Exception
if the installed reactor does not match the │ │ │ +Exception
if the installed reactor does not match the │ │ │TWISTED_REACTOR
setting; therfore, having top-level │ │ │reactor
imports in project files and imported │ │ │ -third-party libraries will make Scrapy raiseException
when │ │ │ +third-party libraries will make Scrapy raiseException
when │ │ │ it checks which reactor is installed.In order to use the reactor installed by Scrapy:
│ │ ││ │ │ -│ │ │import scrapy │ │ │ from twisted.internet import reactor │ │ │ │ │ │ │ │ │ class QuotesSpider(scrapy.Spider): │ │ │ @@ -1425,15 +1425,15 @@ │ │ │ for quote in response.css('div.quote'): │ │ │ yield {'text': quote.css('span.text::text').get()} │ │ │ │ │ │ def stop(self): │ │ │ self.crawler.engine.close_spider(self, 'timeout') │ │ │
which raises
│ │ │ +Exception
, becomes:which raises
│ │ │Exception
, becomes:│ │ ││ │ │import scrapy │ │ │ │ │ │ │ │ │ class QuotesSpider(scrapy.Spider): │ │ │ name = 'quotes' │ │ │ │ │ │ def __init__(self, *args, **kwargs): │ │ │ @@ -1457,15 +1457,15 @@ │ │ │
The default value of the TWISTED_REACTOR setting is None, which means that Scrapy will not attempt to install any specific reactor, and the default reactor defined by Twisted for the current platform will be used. This is to maintain backward compatibility and avoid possible problems caused by using a non-default reactor.
For additional information, see Choosing a Reactor and GUI Toolkit Integration.
│ │ │Default:
│ │ │2083
Scope:
│ │ │spidermiddlewares.urllength
The maximum URL length to allow for crawled URLs. For more information about │ │ │ the default value for this setting see: https://boutell.com/newfaq/misc/urllength.html
│ │ ├── ./usr/share/doc/python-scrapy-doc/html/topics/signals.html │ │ │ @@ -452,15 +452,15 @@ │ │ │ │ │ │ │ │ │Sent after a spider has been closed. This can be used to release per-spider │ │ │ resources reserved on
This signal supports returning deferreds from its handlers.
Parameters
    spider (Spider object) – the spider which has been closed
    reason (str) – a string which describes the reason why the spider was closed. If it was closed because the spider has completed scraping, the reason is 'finished'. Otherwise, if the spider was manually closed by calling the close_spider engine method, then the reason is the one passed in the reason argument of that method (which defaults to 'cancelled'). If the engine was shutdown (for example, by hitting Ctrl-C to stop it) the reason will be 'shutdown'.
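A minimal sketch of connecting a handler to this signal from inside a spider (the spider name and log message are placeholders for this sketch):

import scrapy
from scrapy import signals

class SignalSpider(scrapy.Spider):
    name = 'signal_example'

    @classmethod
    def from_crawler(cls, crawler, *args, **kwargs):
        spider = super().from_crawler(crawler, *args, **kwargs)
        crawler.signals.connect(spider.handle_spider_closed, signal=signals.spider_closed)
        return spider

    def handle_spider_closed(self, spider, reason):
        spider.logger.info('closed %s: %s', spider.name, reason)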
Parameters
    crawler (Crawler instance) – crawler to which the spider will be bound
    args (list) – arguments passed to the __init__() method
    kwargs (dict) – keyword arguments passed to the __init__() method
Nonetheless, this method sets the crawler and settings attributes in the new instance so they can be accessed later inside the spider's code.

yield scrapy.Request(f'http://www.example.com/categories/{self.category}')

Keep in mind that spider arguments are only strings. The spider will not do any parsing on its own. If you were to set the start_urls attribute from the command line, you would have to parse it on your own into a list using something like ast.literal_eval() or json.loads() and then set it as an attribute (see the sketch below). Otherwise, you would cause iteration over a start_urls string (a very common Python pitfall) resulting in each character being seen as a separate url.
A valid use case is to set the http auth credentials used by HttpAuthMiddleware or the user agent…
│ │ │print a report of the engine status
│ │ │ │ │ │prefs
│ │ │for memory debugging (see Debugging memory leaks)
│ │ │ │ │ │ -p
│ │ │ +a shortcut to the
pprint.pprint()
function │ │ │a shortcut to the
pprint.pprint()
function │ │ │ │ │ │ │ │ │ │ │ │hpy
│ │ │for memory debugging (see Debugging memory leaks)
scrapy.extensions.telnet.
update_telnet_vars
(telnet_vars)¶ │ │ │ │ │ │ │ │ │Sent just before the telnet console is opened. You can hook up to this │ │ │ signal to add, remove or update the variables that will be available in the │ │ │ telnet local namespace. In order to do that, you need to update the │ │ │
│ │ │ │ │ │telnet_vars
dict in your handler.│ │ │Telnet settings¶
-
│ │ │ class
-
│ │ │ class
-
│ │ │
Backward-incompatible changes¶

Deprecation removals¶

Bug fixes¶
…TypeError exception (issue 4410)

Quality assurance¶

Scrapy 2.0.0 (2020-03-03)¶
Highlights:
…next() function or MutableChain.__next__ instead (issue 4153)

New features¶
…(issue 374, issue 3986, issue 3989, issue 4176, issue 4188)

Documentation¶
…(issue 4152, issue 4169)
…TypeError exception (issue 4007, issue 4052)
…ChainMap instead. (issue 3878)

Other changes¶
…will be used and the priority parameter ignored. This allows inserting/updating settings with different priorities with a single command.

Event-driven networking¶
Scrapy is written with Twisted, a popular event-driven networking framework for Python. Thus, it's implemented using non-blocking (aka asynchronous) code for concurrency.
For more information about asynchronous programming and Twisted see these links:
│ │ │New in version 2.0.
│ │ │Scrapy has partial support asyncio
. After you install the asyncio
│ │ │ -reactor, you may use asyncio
and
│ │ │ -asyncio
-powered libraries in any coroutine.
Scrapy has partial support asyncio
. After you install the asyncio
│ │ │ +reactor, you may use asyncio
and
│ │ │ +asyncio
-powered libraries in any coroutine.
Warning
│ │ │ -asyncio
support in Scrapy is experimental. Future Scrapy
│ │ │ +
asyncio
support in Scrapy is experimental. Future Scrapy
│ │ │ versions may introduce related changes without a deprecation
│ │ │ period or warning.
Installing the asyncio reactor¶
│ │ │ -To enable asyncio
support, set the TWISTED_REACTOR
setting to
│ │ │ +
To enable asyncio
support, set the TWISTED_REACTOR
setting to
│ │ │ 'twisted.internet.asyncioreactor.AsyncioSelectorReactor'
.
If you are using CrawlerRunner
, you also need to
│ │ │ install the AsyncioSelectorReactor
│ │ │ reactor manually. You can do that using
│ │ │ install_reactor()
:
install_reactor('twisted.internet.asyncioreactor.AsyncioSelectorReactor')
│ │ │
Detecting check runs¶
When scrapy check is running, the SCRAPY_CHECK environment variable is set to the true string. You can use os.environ to perform any change to your spiders or your settings when scrapy check is used:

import os
import scrapy

class ExampleSpider(scrapy.Spider):
    name = 'example'
Coroutines¶
New in version 2.0.
Scrapy has partial support for the coroutine syntax.

Supported callables¶
The following callables may be defined as coroutines using async def, and hence use coroutine syntax (e.g. await, async for, async with):

Coroutines may be used to call asynchronous code. This includes other coroutines, functions that return Deferreds and functions that return awaitable objects such as Future. This means you can use many useful Python libraries providing such code:

import treq
from scrapy import Spider

class MySpider(Spider):
    # ...
    async def parse_with_deferred(self, response):
        additional_response = await treq.get('https://additional.url')
        additional_data = await treq.content(additional_response)
        # ... use response and additional_data to yield items and requests

…
        additional_data = await r.text()
        # ... use response and additional_data to yield items and requests
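The truncated snippet just above uses an asyncio-powered HTTP client; a fuller sketch of that pattern with aiohttp (assuming the asyncio reactor is enabled and aiohttp is installed; the URL and item are placeholders for this sketch):

import aiohttp
import scrapy

class AsyncSpider(scrapy.Spider):
    name = 'async_example'

    async def parse(self, response):
        async with aiohttp.ClientSession() as session:
            async with session.get('https://additional.url') as r:
                additional_data = await r.text()
        # ... use response and additional_data to yield items and requests
        yield {'extra_length': len(additional_data)}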
│ │ │ Note
│ │ │ Many libraries that use coroutines, such as aio-libs, require the
│ │ │ -asyncio
loop and to use them you need to
│ │ │ +asyncio
loop and to use them you need to
│ │ │ enable asyncio support in Scrapy.
│ │ │
│ │ │ Common use cases for asynchronous code include:
│ │ │
│ │ │
│ │ │
│ │ │
│ │ │ DBM storage backend¶
│ │ │
│ │ │
│ │ │
│ │ │
│ │ │
│ │ │ Writing your own storage backend¶
│ │ │ You can implement a cache storage backend by creating a Python class that
│ │ │ @@ -876,15 +876,15 @@
│ │ │
│ │ │ HttpProxyMiddleware¶
│ │ │
│ │ │
│ │ │
│ │ │ RobotFileParser¶
│ │ │ -Based on RobotFileParser
:
│ │ │ +Based on RobotFileParser
:
│ │ │
│ │ │
│ │ │ It is faster than Protego and backward-compatible with versions of Scrapy before 1.8.0.
│ │ │ @@ -1149,31 +1149,31 @@
│ │ │
│ │ │
│ │ │ Handling different response formats¶
│ │ │ Once you have a response with the desired data, how you extract the desired
│ │ │ data from it depends on the type of response:
│ │ │
│ │ │
│ │ │
│ │ │
│ │ │ Once you have a string with the JavaScript code, you can extract the desired
│ │ │ data from it:
│ │ │
│ │ │ -
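For instance, a minimal sketch of pulling a JSON object out of inline JavaScript with the standard library (the variable name and pattern are illustrative assumptions; dedicated libraries such as js2xml or chompjs handle more complex cases):

import json
import re

javascript = 'var data = {"field": "value"};'
match = re.search(r'var data = (\{.*?\});', javascript)
if match:
    data = json.loads(match.group(1))   # {'field': 'value'}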