我想在这个网页上抓取产品的名称,但我得到一个空列表。我将 splash 用于动态网页,但结果是一样的。有人可以告诉我该怎么做吗?任何其他解决方案?
这是我要抓取的网页:https ://www.woolworths.com.au/shop/browse/drinks/cordias-juices-iced-teas/iced-teas
import scrapy
from shop.items import ShopItem
from scrapy_splash import SplashRequest
class Spider(scrapy.Spider) :
name = 'productsspider'
start_urls = ['https://www.woolworths.com.au/shop/browse/drinks/cordials-juices-iced-teas/iced-teas']
def start_requests(self):
for url in self.start_urls:
yield SplashRequest(url=url, callback=self.parse, args={"wait":3})
def parse(self, response):
item = ShopItem()
for p in response.css(".divng-tns-c32-15 product-grid.ng-trigger.ng-trigger-staggerFadeInOut"):
item = productsItem()
item["product_name"] = p.css(".ng-tns-c32-15.product-grid--tile.ng-star-inserted .ng-tns-c32-15.product-grid--tile.ng-star-inserted shared-product-tile section .shelfProductTile-content div header a::text").extract()
yield item