# 在尝试输出网页源代码时,发现它和浏览器中看到的源代码不一样。
import requests
import re
# Browser-like User-Agent sent with the request.
headers = {
    "user-agent": (
        "Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
        "AppleWebKit/537.36 (KHTML, like Gecko) "
        "Chrome/100.0.4896.127 Safari/537.36 Edg/100.0.1185.50"
    ),
}

# Baidu image detail page to download.
# The original literal contained "©right=undefined": the "&copy" at the start
# of "&copyright" had been turned into the copyright sign, which merged two
# query parameters into one. The separator is restored here.
DETAIL_URL = (
    "https://image.baidu.com/search/detail?ct=503316480&z=0&ipn=d"
    "&word=%E7%8C%AB%CD%BC%C6%AC&step_word=&hs=0&pn=0&spn=0"
    "&di=7060663421280190465&pi=0&rn=1&tn=baiduimagedetail&is=0%2C0"
    "&istype=0&ie=utf-8&oe=utf-8&in=&cl=2&lm=-1&st=undefined"
    "&cs=2015190072%2C782484968&os=3153987117%2C2448907738"
    "&simid=3382994032%2C357120187&adpicid=0&lpn=0&ln=1912&fr="
    "&fmq=1650424609892_R&fm=&ic=undefined&s=undefined&hd=undefined"
    "&latest=undefined&copyright=undefined&se=&sme=&tab=0"
    "&width=undefined&height=undefined&face=undefined&ist=&jit=&cg="
    "&bdtype=0&oriquery="
    "&objurl=https%3A%2F%2Fgimg2.baidu.com%2Fimage_search%2Fsrc%3Dhttp%3A%2F%2F"
    "hbimg.b0.upaiyun.com%2F9278ce7ab85990a604efb8d0ac01a5176b4a1bff1d28b0-ZjZ6xa_fw658"
    "%26refer%3Dhttp%3A%2F%2Fhbimg.b0.upaiyun.com%26app%3D2002%26size%3Df9999%2C10000"
    "%26q%3Da80%26n%3D0%26g%3D0n%26fmt%3Dauto%3Fsec%3D1653017059"
    "%26t%3Dfb87f85b3147cbc6d2b1f49ad7c0ea4f"
    "&fromurl=ippr_z2C%24qAzdH3FAzdH3Fi7wkwg_z%26e3Bv54AzdH3FrtgfAzdH3F89ldanacbbAzdH3F"
    "&gsm=2&rpstart=0&rpnum=0&islist=&querylist=&nojc=undefined"
    "&dyTabStr=MCwzLDIsMSw2LDQsNSw3LDgsOQ%3D%3D"
)

# Matches URLs of the form https://img<N>.baidu.com/...u=<digits>,<digits>...
# The original pattern wrote "/d/." for r"\d\.", "[0,9]" for "[0-9]", and
# wrapped everything in literal braces, so it could never match a real URL.
IMAGE_URL_PATTERN = re.compile(
    r"""https?://img\d+\.baidu\.com/[^\s"'<>]*?u=\d+,\d+[^\s"'<>]*"""
)


def find_image_urls(page_source):
    """Return the img<N>.baidu.com image URLs found in *page_source*.

    Args:
        page_source: Text to scan, e.g. the body of an HTTP response.

    Returns:
        A list of the distinct matching URLs in order of first appearance;
        an empty list when nothing matches.
    """
    # dict.fromkeys drops duplicates while keeping first-seen order.
    return list(dict.fromkeys(IMAGE_URL_PATTERN.findall(page_source)))


if __name__ == "__main__":
    # A timeout keeps the script from hanging forever on a stalled connection.
    img = requests.get(DETAIL_URL, headers=headers, timeout=10)
    print(img.text)
    # Search the downloaded page itself; the original matched against the
    # literal string "src" and discarded the result.
    # NOTE(review): this is the raw response body. Anything the browser adds
    # afterwards by running scripts will presumably be missing from it, so an
    # empty result here does not mean the pattern is wrong.
    ret = find_image_urls(img.text)
    print(ret)
# 我只是想检索出图片信息,可是在输出的源代码中,没有找到浏览器页面里原图片对应的代码(图片地址)。
# 原因很可能是页面中的图片由 JavaScript 动态加载,而 requests 只能拿到未经渲染的初始 HTML。
# 有两种解决方式:第一,用浏览器打开页面(由程序驱动真实浏览器);第二,使用能够执行 JavaScript 的渲染插件。