问题代码:
bs4_data = BeautifulSoup(data,'lxml') book_list = bs4_data.select('.book-name') for book in book_list: book_dic = {} book_dic['book_name'] = book.select('.book-name').get_text() print(book_dic)
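把 `.get_text()` 去掉后,输出的是空列表。原因:循环中的 `book` 本身已经是 `.book-name` 元素,再对它调用 `select('.book-name')` 只会在它的子节点中查找,因此得到空列表;而 `select()` 返回的是结果列表,列表没有 `get_text()` 方法,所以原代码会报错。直接对 `book` 调用 `get_text()` 即可,修正后的代码如下: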
from bs4 import BeautifulSoup
# Assumes `data` already holds the HTML markup of the page.
bs4_data = BeautifulSoup(data, 'lxml')
# Every element returned here is itself a `.book-name` node, so its text is
# read directly from the element rather than by calling select() on it again.
book_list = bs4_data.select('.book-name')
for book in book_list:
    # One dict per book, holding the title text.
    book_dic = {'book_name': book.get_text()}
    print(book_dic)