import re

import requests

# Browser-like User-Agent sent with every request below.
headers = {"User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36"}
url = "http://www.aiimg.com/"

# Keep the Response object itself. The original chained `.encode=("utf-8")`
# onto the call, which bound `res` to the string "utf-8" instead of the page.
res = requests.get(url=url, headers=headers, timeout=10)
res.raise_for_status()

# Decode the body with the encoding detected from its bytes rather than a
# hard-coded UTF-8, so a non-UTF-8 page is not turned into mojibake.
res.encoding = res.apparent_encoding
response = res.text
print(response)

# NOTE(review): the original regex was cut off in this file. Extracting every
# src="..." value and keeping only absolute URLs is an assumption -- confirm.
img_url = [link for link in re.findall(r'src="(.*?)"', response) if link.startswith("http")]
print(img_url)

# One output file per URL, numbered from 1. The original nested two extra
# loops here and wrote the same image into every file.
for numbers, photos in enumerate(img_url, start=1):
    print(photos)
    try:
        photo_res = requests.get(url=photos, headers=headers, timeout=10)
        photo_res.raise_for_status()
    except requests.RequestException as err:
        # A single broken link should not abort the remaining downloads.
        print(f"skip {photos}: {err}")
        continue
    # Image data is binary: write the raw bytes, never decode them as text.
    photo_response = photo_res.content
    with open(f"imgs_{numbers}.jpg", "wb") as fp:
        fp.write(photo_response)
    print("OK")
解决方法:
获取到的网页数据需要先解码,该网站使用的编码是 gb2312,而不是 utf-8。
所以,请求和解码部分应改为:
# Fetch the home page with a browser-like User-Agent, then decode the raw
# response bytes explicitly as GB2312 before printing the HTML.
url = "http://www.aiimg.com/"
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36",
}
res = requests.get(url, headers=headers)
# .content is the undecoded body; decoding here bypasses requests' own guess.
response = str(res.content, "gb2312")
print(response)
2、下面下载图片的那一行修改为:
# Image bytes are binary data, not GB2312 text: keep the raw .content so it
# can be written unchanged to a file opened with "wb". Decoding it would raise
# UnicodeDecodeError or produce a str that a binary file cannot accept.
photo_response = requests.get(url=photos, headers=headers).content
```
如有问题及时沟通
前面的代码应该是:
import requests
import re
# Browser-like User-Agent sent with the page request.
headers = {"User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36"}
url = "http://www.aiimg.com/"

# Fetch the page once; the original repeated the same request a second time.
res = requests.get(url=url, headers=headers)
# Set the encoding detected from the body *before* reading res.text, so both
# the URL extraction and the printed HTML use the same correctly decoded text.
res.encoding = res.apparent_encoding

# Collect every src="..." value, then keep only absolute http(s) links.
img_url = re.findall(r'src="(.*?)"', res.text)
img_url = [i for i in img_url if i.startswith('http')]
print(res.text)
搜索官网运用别人模板