Add deprecation warning to HtmlParserLinkExtractor

2025-02-27 07:03:55 +00:00 · 2015-05-04 17:11:05 -03:00 · 2015-05-04 17:11:05 -03:00 · 389f6e95c5
commit 389f6e95c5
parent d00e43f39c
1 changed file with 9 additions and 0 deletions
--- a/scrapy/linkextractors/htmlparser.py
+++ b/scrapy/linkextractors/htmlparser.py
@@ -2,6 +2,7 @@
 HTMLParser-based link extractor
 """
 import warnings
 from HTMLParser import HTMLParser
 from six.moves.urllib.parse import urljoin
@@ -9,12 +10,20 @@ from w3lib.url import safe_url_string
 from scrapy.link import Link
 from scrapy.utils.python import unique as unique_list
 from scrapy.exceptions import ScrapyDeprecationWarning
 class HtmlParserLinkExtractor(HTMLParser):
    def __init__(self, tag="a", attr="href", process=None, unique=False):
        HTMLParser.__init__(self)
        warnings.warn(
            "HtmlParserLinkExtractor is deprecated and will be removed in "
            "future releases. Please use scrapy.linkextractors.LinkExtractor",
            ScrapyDeprecationWarning
        )
        self.scan_tag = tag if callable(tag) else lambda t: t == tag
        self.scan_attr = attr if callable(attr) else lambda a: a == attr
        self.process_attr = process if callable(process) else lambda v: v