import requests
from lxml import etree
# Fetch the qiushibaike text listing page and print the text nodes selected
# by a fixed XPath expression.

# Browser-like User-Agent sent with the request.
headers = {
    "User-Agent": (
        "Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
        "AppleWebKit/537.36 (KHTML, like Gecko) "
        "Chrome/69.0.3497.100 Safari/537.36"
    )
}
url = "https://www.qiushibaike.com/text/"

# requests has no default timeout; without one a stalled connection would
# block this script indefinitely.
response = requests.get(url, headers=headers, timeout=10)
# Fail loudly on 4xx/5xx instead of parsing an error page and printing [].
response.raise_for_status()

selector = etree.HTML(response.text)
# NOTE(review): the id "qiushi_tag_121225349" looks specific to a single post;
# if that element is not in the fetched page the result is an empty list.
# Confirm the id against the actual HTML before relying on this query.
result = selector.xpath('//*[@id="qiushi_tag_121225349"]/a[1]/div/span/text()')
print(result)
建议按下面的步骤逐步调试:
response = requests.get(url,headers = headers)
如果这一步拿到了预期的页面内容,说明抓取是正确的;否则说明请求有问题,需要抓包检查实际发出的请求和 url。
如果 html 获取正确,再检查 result = selector.xpath('//*[@id="qiushi_tag_121225349"]/a[1]/div/span/text()')
一层一层来排查:首先看 [@id="qiushi_tag_121225349"] 这个节点在返回的 html 中是否存在,
然后依次看它下面的 a、div、span……是否存在。