import re
import requests
# Douban chart endpoint; the query string asks for one entry (start=0, limit=1).
url = "https://movie.douban.com/j/chart/top_list?type=11&interval_id=100%3A90&action=&start=0&limit=1"
# Send a desktop Chrome User-Agent string with the request
# (presumably so the site answers as it would for a browser -- confirm).
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/106.0.0.0 Safari/537.36"
}
# Fetch the source of the second request.
# The timeout keeps the script from hanging forever if the server never answers.
reap = requests.get(url=url, headers=headers, timeout=10)
page_countent = reap.text  # page source
print(page_countent)
# "[" and "]" delimit a character class in a regular expression, so they are
# escaped here in order to match the literal brackets of the JSON arrays.
obj = re.compile(
    r'"id":"1292052","types":\["犯罪","剧情"\],"regions":\["美国"\],"title":"肖申克的救赎"',
    re.S,
)
it = obj.finditer(page_countent)
# Print every occurrence of the pattern found in the page source.
for i in it:
    print(i.group())
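# Square brackets have a special meaning in a regular expression (they delimit a
# character class); to match literal "[" and "]" you must escape them as \[ and \].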
# Pattern for one literal JSON fragment; the array brackets are backslash-escaped
# so they match "[" and "]" themselves instead of opening a character class.
obj = re.compile(
    r'"id":"1292052","types":\["犯罪","剧情"\],'
    r'"regions":\["美国"\],"title":"肖申克的救赎"',
    flags=re.S,
)