我正嘗試使用 Python 和 Scrapy,從 Subway UK 的 Restaurant Finder(餐廳搜尋器)抓取門市位置數據。我已經能夠抓取單一頁面,但我想把它設置成能遍歷鏈接末尾的 1000 個遞歸標識(id)列表。任何幫助,我都將不勝感激。(標題:使用 Scrapy 抓取遞歸頁面數據)
免責聲明:我不知道我在做什麼
from scrapy.spider import BaseSpider
from scrapy.selector import HtmlXPathSelector
from subway.items import SubwayFinder
class MySpider(BaseSpider):
    """Spider that scrapes a Subway UK store-detail page.

    The crawl starts from the single store-detail URL in ``start_urls``
    and, for every ``<div class="mid">`` on the response, emits one
    ``SubwayFinder`` item whose ``title`` field holds the text nodes found
    under ``p/span`` inside that div.
    """

    name = "subway"
    # allowed_domains must contain bare domain names, not URLs: Scrapy's
    # offsite filtering compares request host names against these entries,
    # so a value with a scheme and trailing slash never matches.
    allowed_domains = ["subway.co.uk"]
    start_urls = ["http://www.subway.co.uk/business/storefinder/store-detail.aspx?id=453056039"]

    def parse(self, response):
        """Extract one item per ``div.mid`` block in the response.

        Args:
            response: the downloaded page handed over by Scrapy.

        Returns:
            A list of ``SubwayFinder`` items; each item's ``"title"`` is
            the list of strings extracted from ``p/span/text()``.
        """
        hxs = HtmlXPathSelector(response)
        titles = hxs.select("//div[@class='mid']")
        items = []
        # Use a distinct loop variable so the selector list being iterated
        # is not rebound while looping over it.
        for title in titles:
            item = SubwayFinder()
            item["title"] = title.select("p/span/text()").extract()
            items.append(item)
        return items