# Download one Baidu Tieba listing page, print it, and save the raw bytes
# to an HTML file in the current working directory.

# 1. Import the HTTP client library.
import requests

# 2. Identify ourselves with a browser-like User-Agent request header.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36'
}

# 3. The URL to fetch.
# NOTE(review): pn=100 is presumably the paging offset for the third page
# (the output file name below says "page three") -- confirm against the site.
url = 'http://tieba.baidu.com/f?kw=传智播客&ie=utf-8&pn=100'

# 4. Send the request and keep the response.
# A timeout is set so a stalled connection raises instead of hanging forever.
response = requests.get(url, headers=headers, timeout=10)

# 5. Show the result on the console (e.g. the PyCharm run window).
# bytes.decode() defaults to UTF-8.
print(response.content.decode())

# 6. Write the raw response bytes to a file created in the current directory.
with open('贴吧第三页.html', 'wb') as f:
    f.write(response.content)