# 导入模块
import requests
import csv
from bs4 import BeautifulSoup
# Browser-like User-Agent header sent with every request.
HEADERS = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.75 Safari/537.36'
}
# Destination CSV file for the scraped listings.
OUTPUT_PATH = r'F:\爬虫\lianjia\lianjia.csv'
# Column names written as the first CSV row (spelling kept as in the original).
CSV_HEADER = ['title', 'totalprice', 'unitprice', 'imformation', 'address']
# Seconds to wait for the server before giving up, so a stalled
# connection cannot hang the script forever.
REQUEST_TIMEOUT = 10


def clean_unit_price(text):
    """Return *text* with all commas removed.

    ``str.replace`` returns a new string, so the result must be used;
    the original script called it and threw the result away.
    """
    return text.replace(",", "")


def parse_listing(info):
    """Extract one listing's fields from its ``<li>`` element.

    Each field is printed as soon as it is extracted.

    Args:
        info: BeautifulSoup tag for one ``<li>`` of the listing ``<ul>``.

    Returns:
        A list ``[title, totalprice, unitprice, information, address]``
        of strings, in the same order as ``CSV_HEADER``.

    Raises:
        AttributeError: if an expected element is missing, because
            ``find`` then returns ``None``.
    """
    title = info.find('div', {'class': 'title'}).find('a').get_text()
    print(title)

    price_box = info.find('div', {'class': 'priceInfo'})
    totalprice = price_box.find('div', {'class': 'totalPrice totalPrice2'}).find('span').get_text() + "万"
    print(totalprice)

    unitprice = clean_unit_price(
        price_box.find('div', {'class': 'unitPrice'}).find('span').get_text()
    )
    print(unitprice)

    information = info.find('div', {'class': 'houseInfo'}).get_text()
    print(information)

    address = info.find('div', {'class': 'flood'}).find('div', {'class': 'positionInfo'}).find('a').get_text()
    print(address)

    return [title, totalprice, unitprice, information, address]


def scrape_page(page):
    """Download result page number *page* and return its listings as rows.

    The raw response text, the parsed document and the list of ``<li>``
    elements are printed along the way, as in the original script.

    Args:
        page: page number substituted into the listing URL.

    Returns:
        A list of rows, one per ``<li>``, as produced by ``parse_listing``.
    """
    url = f'https://wh.lianjia.com/ershoufang/pg{page}/'
    # Send the request and get the response.
    response = requests.get(url, headers=HEADERS, timeout=REQUEST_TIMEOUT)
    # Pull the page source out of the response.
    html = response.text
    print(html)
    print('****************')
    soup = BeautifulSoup(html, features="lxml")
    print(soup)
    # Data extraction: every <li> inside the listing <ul>.
    infos = soup.find('ul', {'class': 'sellListContent'}).find_all('li')
    print(infos)

    rows = []
    for info in infos:
        rows.append(parse_listing(info))
    return rows


def save_listings(rows, path=OUTPUT_PATH):
    """Write the header row followed by every row in *rows* to *path*.

    This answers the question left in the original script (how to write
    the data after the header): ``csv.writer.writerow`` takes ONE
    iterable per row, so a listing is written as
    ``writerow([title, totalprice, ...])``, not as five separate
    arguments. ``writerows`` does that for a whole list of rows.

    Args:
        rows: iterable of rows, each an iterable of field values.
        path: output file path; defaults to ``OUTPUT_PATH``.
    """
    # 'with' closes the file even if writing fails; newline="" is what
    # the csv module expects so it can control line endings itself.
    with open(path, 'w', encoding='utf-8-sig', newline="") as f:
        csv_write = csv.writer(f)
        csv_write.writerow(CSV_HEADER)
        csv_write.writerows(rows)


def main():
    """Scrape the configured page range and save every listing to CSV."""
    rows = []
    for page in range(1, 2):
        rows.extend(scrape_page(page))
    # The file is opened once, after scraping, so pages never overwrite
    # each other and every listing (not just the last one) is written.
    save_listings(rows)


if __name__ == "__main__":
    main()