class BooksSpider(scrapy.Spider):
    """Spider that builds its initial request explicitly via start_requests().

    Instead of relying on the ``start_urls`` class attribute, the spider
    overrides ``start_requests`` so the first request can carry a custom
    callback, custom headers and ``dont_filter=True``.
    """

    # NOTE(review): no ``name`` attribute is defined in this class; Scrapy
    # needs one to identify the spider -- confirm whether it was elided.

    # Kept for reference: the class attribute that start_requests() replaces.
    # start_urls = ['http://books.toscrape.com/']

    def start_requests(self):
        """Yield the initial request, replacing the ``start_urls`` attribute.

        Yields:
            A single ``scrapy.Request`` for the site's front page whose
            response is handed to ``parse_book``.
        """
        yield scrapy.Request(
            'http://books.toscrape.com/',
            # Use parse_book rather than the default callback.
            callback=self.parse_book,
            headers={'User-Agent': 'Mozilla/5.0'},
            dont_filter=True,
        )

    def parse_book(self, response):
        """Callback invoked with the response of the initial request.

        ``self`` is required because the method is registered as the bound
        method ``self.parse_book``.
        """
        ...