from urllib import request
from bs4 import BeautifulSoup
import requests
import re
from fake_useragent import UserAgent
# Headers sent with each request. The User-Agent string is picked at random
# once, when this line runs, so every later request reuses the same value.
req_header = {
    'User-Agent': str(UserAgent().random),
}
def getHTMLText(url):
    """Fetch *url* with an HTTP GET and return the response body as text.

    Args:
        url: Absolute URL including its scheme, e.g. ``"http://www.qq.com"``.
            A URL without a scheme is rejected by ``requests`` and therefore
            produces the failure marker described below.

    Returns:
        The decoded page text on success, or the literal string ``"产生异常"``
        when the request fails (invalid URL, connection error, timeout, or
        an HTTP 4xx/5xx status). Callers cannot distinguish the marker from
        a page whose body happens to be that exact string.
    """
    try:
        r = requests.get(url, timeout=30, headers=req_header)
        # Turn 4xx/5xx responses into requests.HTTPError.
        r.raise_for_status()
        # Decode with the encoding detected from the body instead of the
        # one declared in the response headers.
        r.encoding = r.apparent_encoding
        return r.text
    except requests.RequestException:
        # Only request-level failures map to the marker; KeyboardInterrupt,
        # SystemExit and genuine programming errors are no longer swallowed.
        return "产生异常"
# requests needs an absolute URL: without the scheme the request is rejected
# (MissingSchema) and getHTMLText returns its failure marker instead of a page.
url_zhangjie = 'https://www.qq.com'
# Despite its name, url_neirong holds the fetched page text (or the failure
# marker string), not a URL.
url_neirong = getHTMLText(url_zhangjie)
print(url_neirong)
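# Output when the URL is given as 'www.qq.com': 产生异常
# Cause: the URL has no protocol prefix (http:// or https://), so requests
# raises MissingSchema, which getHTMLText catches and reports as "产生异常".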