import re
import requests
url = "https://www.xbiquge.la/"


def getbook(url):
    """Download the page at *url* and print every item the pattern matches.

    For each match, the tuple of all captured groups (name, href, shuming,
    jieshao) is printed first, followed by the ``name`` group on its own line.

    Args:
        url: Address of the page to download.
    """
    headers = {
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.101 Safari/537.36 Edg/91.0.864.48"
    }
    # Without a timeout, requests waits indefinitely on a stalled server.
    response = requests.get(url, headers=headers, timeout=10)
    response.encoding = 'utf-8'
    page_content = response.text
    obj = re.compile(
        r'<div class="item">.*?<span>(?P<name>.*?)</span>'
        r'<a href="(?P<href>.*?)">'
        r'(?P<shuming>.*?)</a></dt>.*?'
        r'<dd>(?P<jieshao>.*?)</dd>', re.S)
    # findall() returns plain tuples, which have no .group() method;
    # finditer() yields Match objects, so named groups can be read.
    for it in obj.finditer(page_content):
        print(it.groups())
        print(it.group("name"))


getbook(url)
import re
import requests
url = "https://www.xbiquge.la/"


def getbook(url):
    """Fetch *url* and print each pattern match together with its name group.

    Every match produces two lines of output: the tuple of all captured
    groups (name, href, shuming, jieshao), then the ``name`` group alone.

    Args:
        url: Address of the page to download.
    """
    request_headers = {
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.101 Safari/537.36 Edg/91.0.864.48"
    }
    # A timeout keeps the call from blocking forever if the server stalls.
    get_url = requests.get(url, headers=request_headers, timeout=10)
    get_url.encoding = 'utf-8'
    page_content = get_url.text
    obj = re.compile(
        r'<div class="item">.*?<span>(?P<name>.*?)</span>'
        r'<a href="(?P<href>.*?)">'
        r'(?P<shuming>.*?)</a></dt>.*?'
        r'<dd>(?P<jieshao>.*?)</dd>', re.S)
    # re.search() only ever returns the first match, so calling it inside
    # the loop printed the same name for every item (and raised when there
    # was no match). Iterating Match objects gives each item's own name.
    for match in obj.finditer(page_content):
        print(match.groups())
        print(match.group("name"))


getbook(url)
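group 不能用于元组:re.findall 返回的是由各分组内容组成的元组列表,元组没有 group 方法;若要按组名取值,应改用 re.finditer,它返回的是 Match 对象,可以调用 group("name")。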
您好,我是有问必答小助手,您的问题已经有小伙伴解答了,您看下是否解决,可以追评进行沟通哦~
如果有您比较满意的答案 / 帮您提供解决思路的答案,可以点击【采纳】按钮,给回答的小伙伴一些鼓励哦~~
ps: 问答会员年卡【8折】购 ,限时加赠IT实体书,即可 享受50次 有问必答服务,了解详情>>>https://t.csdnimg.cn/RW5m