From 142367a5f0499352fff991ab3bd5cb6b3d772bd0 Mon Sep 17 00:00:00 2001
From: Seven2Nine <61679388+Seven2Nine@users.noreply.github.com>
Date: Wed, 8 Jul 2020 11:06:52 +0800
Subject: [PATCH] Update spider.py
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

修复“//” 开头的url报错
ValueError('Missing scheme in request url: %s' % self._url)
---
 backend/template/scrapy/config_spider/spiders/spider.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/backend/template/scrapy/config_spider/spiders/spider.py b/backend/template/scrapy/config_spider/spiders/spider.py
index d87f4297..09dfdf5e 100644
--- a/backend/template/scrapy/config_spider/spiders/spider.py
+++ b/backend/template/scrapy/config_spider/spiders/spider.py
@@ -9,7 +9,7 @@ def get_real_url(response, url):
         return url
     elif re.search(r'^\/\/', url):
         u = urlparse(response.url)
-        return u.scheme + url
+        return u.scheme + ":" + url
     return urljoin(response.url, url)
 
 class ConfigSpider(scrapy.Spider):