Web scraping:Scrapy 的 __init__ 返回 None
我有一个 Scrapy 脚本 Web scraping Scrapy init返回一个None,web-scraping,scrapy,web-crawler,scrapy-pipeline,Web Scraping,Scrapy,Web Crawler,Scrapy Pipeline,我有一个 Scrapy 脚本 class QuotesSpider(scrapy.Spider): name = 'quotes' def __init__(self, *args, **kwargs): super(QuotesSpider, self).__init__(*args, **kwargs) self.cat = [kwargs.get('cat')] print(self.cat) def start_requests(self): #print(s
class QuotesSpider(scrapy.Spider):
    """Spider that records the ``cat`` keyword argument it was created with."""

    name = 'quotes'

    def __init__(self, *args, **kwargs):
        """Initialise the base spider and store ``cat`` wrapped in a list.

        ``kwargs.get('cat')`` evaluates to ``None`` when no ``cat`` keyword
        argument was supplied, so ``self.cat`` is ``[None]`` in that case.
        """
        super(QuotesSpider, self).__init__(*args, **kwargs)
        self.cat = [kwargs.get('cat')]
        print(self.cat)

    def start_requests(self):
        """Yield one request per hard-coded URL, with ``self.parse`` as callback."""
        # print(self.params)
        urls = ['https://google.com/html/?q=a%v%c']
        for url in urls:
            yield scrapy.Request(url=url, callback=self.parse)
在命令行上:
scrapy crawl quotes -a cat="avc"
当我运行该命令时,它打印的是 None。
如何在程序中访问通过命令行传递的值 "avc"?
你的代码中缺少了一些内容,请参考下面的示例代码:
class QuotesSpider(scrapy.Spider):
    """Spider that searches for the value given as the ``cat`` keyword argument."""

    name = 'quotes'

    def __init__(self, *args, **kwargs):
        """Initialise the base spider and keep the raw ``cat`` argument.

        ``self.cat`` is ``None`` when no ``cat`` keyword argument is supplied.
        """
        super(QuotesSpider, self).__init__(*args, **kwargs)
        self.cat = kwargs.get('cat')
        print(self.cat)

    def start_requests(self):
        """Yield a request for the search URL built from ``self.cat``."""
        # print(self.params)
        # The value of ``cat`` is interpolated into the query string as-is.
        urls = [f"https://www.google.com/search?q={self.cat}"]
        # urls = ['https://google.com/html/?q=a%v%c']
        for url in urls:
            yield scrapy.Request(url=url, callback=self.parse)

    def parse(self, response):
        """Print the received response followed by a marker string."""
        print(response, "Response <---")
class QuotesSpider(scrapy.Spider):
    """Spider that searches for the value given as the ``cat`` keyword argument."""

    name = 'quotes'

    def __init__(self, *args, **kwargs):
        """Initialise the base spider and keep the raw ``cat`` argument.

        ``self.cat`` is ``None`` when no ``cat`` keyword argument is supplied.
        """
        super(QuotesSpider, self).__init__(*args, **kwargs)
        self.cat = kwargs.get('cat')
        print(self.cat)

    def start_requests(self):
        """Yield a request for the search URL built from ``self.cat``."""
        # print(self.params)
        # The value of ``cat`` is interpolated into the query string as-is.
        urls = [f"https://www.google.com/search?q={self.cat}"]
        # urls = ['https://google.com/html/?q=a%v%c']
        for url in urls:
            yield scrapy.Request(url=url, callback=self.parse)

    def parse(self, response):
        """Print the received response followed by a marker string."""
        print(response, "Response <---")
<200 https://www.google.com/search?q=avc> Response <---