li_list = tree.xpath('//div[@class="figure-result"]/ul/li')  # 这是我写的代码,但 print(li_list) 输出的一直是空列表,请大神指点一下。
import requests
from lxml import etree
import os
if __name__ == "__main__":
    # Download the Sogou image-search result page for a fixed query and print
    # the <li> elements matched under <div class="figure-result">.
    #
    # NOTE(review): the printed list has been reported to be empty. Presumably
    # the image list is injected by JavaScript after the page loads, so it is
    # not present in the static HTML that requests receives -- confirm by
    # inspecting page_text.

    # Pose as a browser: send the User-Agent value a real browser would send.
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.125 Safari/537.36'
    }

    # Not read anywhere in the visible code; kept in case code outside this
    # view relies on these names.
    num = 0
    num_1 = 0
    num_2 = 0

    x = 2  # number of times the page is requested

    # exist_ok avoids the check-then-create race of os.path.exists + os.mkdir.
    os.makedirs('./picLibs', exist_ok=True)

    # The URL does not depend on the loop variable, so build it once.
    url = 'https://pic.sogou.com/pics?query='+'橘子皮'

    # NOTE(review): `i` is never used in the request, so every iteration
    # fetches the same URL -- confirm whether a paging parameter was intended.
    for i in range(int(x)):
        # A timeout keeps a stalled connection from hanging the script forever.
        response = requests.get(url=url, headers=headers, timeout=10)
        # Fail loudly on HTTP errors instead of parsing an error page.
        response.raise_for_status()
        page_text = response.text

        tree = etree.HTML(page_text)
        li_list = tree.xpath('//div[@class="figure-result"]/ul/li')
        print(li_list)
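你可以先把 page_text 打印出来看看:requests 获取到的 HTML 源码中并没有那部分图片数据,所以 XPath 匹配不到任何节点,li_list 自然是空列表。这说明图片数据是由 JavaScript 动态加载的,你需要换一种方式获取,比如使用 selenium 渲染页面后再解析,或者在浏览器开发者工具的 Network 面板中找到实际返回图片数据的接口并直接请求它。望采纳!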