from urllib import request,parse
from urllib.error import HTTPError,URLError
def get(url, headers=None):
    """Send a request for *url* without form data.

    Args:
        url: Address to fetch.
        headers: Optional dict of request headers, forwarded unchanged to
            ``urlrequests``.

    Returns:
        Whatever ``urlrequests`` returns for the same ``url`` and ``headers``.
    """
    return urlrequests(url, headers=headers)
def post(url, form, headers=None):
    """Send a request for *url* carrying *form* as its data.

    Args:
        url: Address to send the request to.
        form: Form fields, forwarded to ``urlrequests`` as its ``form``
            argument.
        headers: Optional dict of request headers, forwarded unchanged to
            ``urlrequests``.

    Returns:
        Whatever ``urlrequests`` returns for the same arguments.
    """
    return urlrequests(url, form, headers=headers)
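# 1. Take the url that is passed in
# 2. Set the user_agent
# 3. Build the headers
# 4. Create the Request object
# 5. Call urlopen
# 6. Return the response as a byte array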
def urlrequests(url, form=None, headers=None):
    """Open *url* with urllib and return the raw response body.

    Args:
        url: Address to open.
        form: Optional form fields. When truthy they are URL-encoded,
            encoded as UTF-8 and sent as the request data; otherwise the
            request is built without data.
        headers: Optional dict of request headers. When ``None``, a single
            browser-like ``User-Agent`` header is used.

    Returns:
        The response body as ``bytes``. If opening the URL raises
        ``URLError`` (which includes ``HTTPError``), the error is printed
        and ``b''`` is returned.
    """
    user_agent = (
        'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 '
        '(KHTML, like Gecko) Chrome/67.0.3396.99 Safari/537.36'
    )
    if headers is None:
        # The HTTP header name uses a hyphen, not an underscore.
        headers = {'User-Agent': user_agent}

    html_bytes = b''
    try:
        if form:
            form_bytes = parse.urlencode(form).encode('utf-8')
            req = request.Request(url, data=form_bytes, headers=headers)
        else:
            req = request.Request(url, headers=headers)
        # The context manager closes the response once the body is read.
        with request.urlopen(req) as response:
            html_bytes = response.read()
    except URLError as e:
        # HTTPError is a subclass of URLError, so this clause covers both.
        print(e)
    return html_bytes
# Script entry point: fetch a sample page and print the returned bytes.
if __name__ == '__main__':
    url = 'http://baidu.com'
    html_bytes = get(url)
    print(html_bytes)