start_urls = [
def parse(self, response):
    """Handle a shop page and hand it over to ``shopParser``.

    Reads the shop title and sell count from ``response`` via the spider's
    own helpers and passes them, together with the response, to
    ``shopParser``.

    Args:
        response: The response object for the downloaded shop page.

    Returns:
        The generator created by ``shopParser``; iterating it produces the
        scraped items.
    """
    shop_title = self.getShopTitle(response)
    sell_count = self.getSellCount(response)
    # shopParser is a generator function: merely calling it runs none of its
    # body. The generator has to be returned so the caller iterates it;
    # discarding it (as before) silently produced no items at all.
    return self.shopParser(response, shop_title, sell_count)
def shopParser(self, response, shop_title, sell_count):
    """Yield one ``EbayItem`` per listing link found on a shop page.

    Nothing is yielded when ``sell_count`` is not greater than zero.

    Args:
        response: Response for the shop page; queried with XPath.
        shop_title: Value stored under ``'shop_title'`` on every item.
        sell_count: Value stored under ``'sell_count'`` on every item; also
            gates whether any items are produced.

    Yields:
        A freshly created ``EbayItem`` for each link in the listing.
    """
    if sell_count > 0:
        item_links = response.xpath('//ul[@id="ListViewInner"]/li/h3/a/@href').extract()
        # The price XPath is evaluated against this same response for every
        # link, so its result cannot change between iterations: compute once.
        item_price = response.xpath('//span[@itemprop="price"]/text()').extract_first()
        # NOTE(review): the link itself is never requested, so every item gets
        # the price found on the shop page, not on the linked item page.
        # Following each link needs a new request per link -- confirm intent.
        for _link in item_links:
            # Build a new item per iteration; re-yielding one shared mutable
            # item makes every consumer hold a reference to the same object.
            item = EbayItem()
            item['shop_title'] = shop_title
            item['sell_count'] = sell_count
            item['item_price'] = item_price
            yield item
答案 0(得分:1)
-- Aggregate all rows of the movies table into one JSON array. Each row becomes
-- a JSON object with the keys rank, name, director, year, rating and starring,
-- taken from the columns of the same names.
-- NOTE(review): json_group_array/json_object look like SQLite's JSON
-- functions -- confirm the target database engine.
SELECT json_group_array(json_object('rank', rank
, 'name', name
, 'director', director
, 'year', year
, 'rating', rating
, 'starring', starring))
FROM movies;
# These new requests will also be routed through parse:
def parse(self, response):
    """Parse a page and schedule a follow-up request for every listing link.

    ``shop_title`` and ``sell_count`` are taken from ``response.meta`` when a
    previous request stored them there; otherwise they are read from the
    page through the spider's ``getShopTitle`` / ``getSellCount`` helpers.

    Args:
        response: The downloaded page; must expose ``meta``, ``xpath`` and
            ``urljoin``.

    Yields:
        One ``scrapy.Request`` per listing link, carrying ``shop_title`` and
        ``sell_count`` in its ``meta``. Nothing is yielded when
        ``sell_count`` is not greater than zero.
    """
    meta = response.meta
    # Look the helpers up lazily: ``meta.get(key, helper(response))`` would
    # run the helper on every response, even when the value is already
    # carried over in meta from the originating page.
    if 'shop_title' in meta:
        shop_title = meta['shop_title']
    else:
        shop_title = self.getShopTitle(response)
    if 'sell_count' in meta:
        sell_count = meta['sell_count']
    else:
        sell_count = self.getSellCount(response)
    # your item-parsing logic goes here
    if sell_count > 0:
        item_links = response.xpath('//ul[@id="ListViewInner"]/li/h3/a/@href').extract()
        # yield requests to next pages
        for link in item_links:
            # urljoin resolves the (possibly relative) href against the page URL.
            yield scrapy.Request(response.urljoin(link), meta={'shop_title': shop_title, 'sell_count': sell_count})