用 scrapy-splash 爬取网站时，为什么 iframe 中的内容没有被返回？
import scrapy
from scrapy import Selector
class Music163Spider(scrapy.Spider):
    """Spider that requests the music.163.com top-list page via Splash.

    Each start URL is sent with a ``splash`` meta entry so that a
    scrapy-splash setup renders the page before ``parse`` receives it.
    """

    name = "music163"
    # Domain names only. Scrapy's offsite filtering matches these entries
    # against the request hostname, so an entry that carries a path or a
    # "#fragment" can never match any request.
    allowed_domains = ["music.163.com"]
    start_urls = ['http://music.163.com/#/discover/toplist/']

    def parse(self, response):
        """Print the text body of the response for a start URL.

        NOTE(review): the output reportedly lacks the content shown inside
        the page's <iframe>; that content presumably has to be requested
        separately (e.g. by following the iframe's URL) -- confirm against
        the Splash documentation.
        """
        print("parse:", response.text)

    def start_requests(self):
        """Yield one request per entry in ``start_urls``.

        Every request uses ``parse`` as its callback and carries Splash
        options in ``meta``: the ``render.html`` endpoint with a ``wait``
        argument of 0.5.
        """
        for url in self.start_urls:
            yield scrapy.Request(url, self.parse, meta={
                'splash': {
                    'endpoint': 'render.html',
                    'args': {
                        'wait': 0.5,
                    }
                }
            })
你需要在 parse 中获取 iframe 的 URL，然后对该 URL 再次发起请求，才能拿到 iframe 中的内容。