Fix GH issue #1550 - scrapy shell URL argument handling: "example.com" now requests "http://example.com"; "example" requests "file://example"; "./example.com" requests "file://example.com"

2025-02-28 17:57:55 +00:00 · 2015-11-02 16:08:19 +03:00 · 2015-11-02 16:08:19 +03:00 · bc9db65358
commit bc9db65358
parent a41c64bfb9
1 changed files with 12 additions and 1 deletions
--- a/scrapy/commands/shell.py
+++ b/scrapy/commands/shell.py
@ -5,11 +5,13 @@ See documentation in docs/topics/shell.rst
 """
 from threading import Thread
 import urlparse
 from w3lib.url import any_to_uri
 from scrapy.commands import ScrapyCommand
 from scrapy.shell import Shell
 from scrapy.http import Request
 from scrapy.utils.url import add_http_if_no_scheme
 from scrapy.utils.spider import spidercls_for_request, DefaultSpider
@ -43,8 +45,17 @@ class Command(ScrapyCommand):
    def run(self, args, opts):
        url = args[0] if args else None
        if url:
            parts = urlparse.urlsplit(url)
            if not parts.scheme:
                if "." not in parts.path.split("/", 1)[0]:
                    url = any_to_uri(url)
                for pattern in ["/", "./", "../"]:
                    if url.startswith(pattern):
                        url = any_to_uri(url)
                        break
                url = add_http_if_no_scheme(url)
        spider_loader = self.crawler_process.spider_loader
        spidercls = DefaultSpider