帮忙看看什么错误
import re
from idlelib.iomenu import encoding
import csv
import requests
from bs4 import BeautifulSoup
import time
import pandas as pd
import xlwt
import chardet
dm_data = [] # 弹幕数据
dm_text = [] # 弹幕本体
# 弹幕的八个参数和弹幕本体
DM_hour = []
DM_time = []
DM_mode = []
DM_font = []
DM_color = []
DM_realTime = []
DM_pool = []
DM_userID = []
DM_id = []
DM_text = []
url="https://www.bilibili.com/video/BV1bL4y1V7q1?p=25&spm_id_from=333.337.top_right_bar_window_history.content.click&vd_source=7e680828c89d6c219caf0d8b6c63b41b"
headers={
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:102.0) Gecko/20100101 Firefox/102.0"
}
resp=requests.get(url,headers=headers)
page_content=resp.text
obj=re.compile(r'{"cid":(?P<lzs>.*?),',re.S)
result=obj.finditer(page_content)
f=open("data.csv",mode='w',encoding='utf8')
csvwriter=csv.writer(f)
for it in result:
cid=it.group("lzs")
url = f'https://comment.bilibili.com/{cid}.xml'
response = requests.get(url)
response.encoding=response.apparent_encoding
page_content = response.text
soup = BeautifulSoup(page_content, 'lxml')
all = soup.find_all("d")
for d in all:
# 弹幕数据
dm_data.append(str(d.get("p")).split(","))
# 弹幕本体
dm_text.append(d.get_text())
for i in dm_data:
a=i[4]
time_local = time.localtime(int(a))
dt = time.strftime("%Y-%m-%d %H:%M:%S", time_local)
i[4]=dt
DM_time.append(i[0])
DM_mode.append(i[1])
DM_font.append(i[2])
DM_color.append(i[3])
DM_realTime.append(i[4])
DM_pool.append(i[5])
DM_userID.append(i[6])
DM_id.append(i[7])
for a in dm_text:
DM_text.append(a)
dt={"DM_time":DM_time,"DM_mode":DM_mode,"DM_font":DM_font,"DM_color":DM_color,
"DM_realTime":DM_realTime,"DM_pool":DM_pool,"DM_userID":DM_userID,"DM_id":DM_id,"DM_text":DM_text}
d=pd.DataFrame(dt)
d.to_csv('C:\\Users\\86151\\PycharmProjects\\pythonProject\\1.csv',encoding='utf-8-sig') #存储弹幕信息
print("over!")
在错误处打个断点,然后看看即将发生错误前的时候,各个变量的数值是什么。
代码有些长,建议加断点测试