import requests
from retrying import retry
# Helpers dedicated to requesting the content of a URL.
# Request headers passed to requests.get(); only the User-Agent field is set
# (a desktop Chrome user-agent string).
header1 = {"User-Agent": "Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/72.0.3626.121 Safari/537.36"}
# Run the decorated function up to 3 times: the error is only raised once all
# three attempts have failed; if any attempt succeeds, the program carries on.
@retry(stop_max_attempt_number=3)
def parse1_url(url):
    """Send a GET request to *url* and return the response body as text.

    The request is sent with the module-level ``header1`` headers and a
    5-second timeout. The raw body bytes are decoded with ``bytes.decode()``
    defaults (UTF-8, strict), so a body that is not valid UTF-8 raises and
    counts as a failed attempt.
    """
    # Separator printed on every attempt; makes the retries visible in tests.
    print("*" * 30)
    raw_body = requests.get(url, headers=header1, timeout=5).content
    return raw_body.decode()
def parse_url(url):
    """Fetch *url* via ``parse1_url`` and return its text, or ``None`` on failure.

    This is the best-effort wrapper around ``parse1_url``: any ordinary error
    raised by it (after its retries are exhausted) is swallowed and reported
    to the caller as ``None``.

    Args:
        url: Address to request.

    Returns:
        The decoded response body, or ``None`` if the fetch failed.
    """
    try:
        return parse1_url(url)
    except Exception:
        # Catch Exception rather than using a bare ``except`` so that
        # KeyboardInterrupt / SystemExit still propagate and the user can
        # abort a hanging fetch with Ctrl-C.
        return None
# Script entry point: small manual demo of parse_url.
if __name__ == '__main__':
    url = "http://www.baidu.com"
    html_str = parse_url(url)
    # parse_url returns None when the fetch fails, so guard before slicing
    # instead of crashing with "TypeError: 'NoneType' is not subscriptable".
    print(html_str[:100] if html_str is not None else None)
    # Use a malformed address (no scheme) to exercise the failure path:
    # the request errors on each of the 3 attempts and None is printed.
    url1 = "www.baidu.com"
    print(parse_url(url1))