import urllib.request
# Note: this URL uses https.
url = 'https://www.baidu.com'
# A URL consists of: scheme (http, https), host, port, path, parameters, anchor.
# Default ports: http -> 80, https -> 443.

# Per the original author's note, a bare urllib.request.urlopen(url) stopped
# working for this URL, so the request is sent with a browser User-Agent header.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
}

# Build a Request object so the custom headers travel with the request.
request = urllib.request.Request(url=url, headers=headers)

# Use the response as a context manager so the underlying connection is
# closed as soon as the body has been read, even if read/decode raises.
with urllib.request.urlopen(request) as response:
    content = response.read().decode('utf-8')

print(content)
# Add our User-Agent:
# Request headers: start from an empty mapping and register the
# browser-style User-Agent string under its header name.
headers = {}
headers['User-Agent'] = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36'
# See the result: