一、爬取汽车之家新闻
- pip3 install beautifulsoup4
- pip3 install lxml
import pymysql
import requests
from bs4 import BeautifulSoup
# Fetch the first page of the Autohome news listing.
# An explicit timeout is passed because requests applies none by default, so
# a stalled connection would otherwise block the script indefinitely.
res = requests.get('https://www.autohome.com.cn/news/1/#liststart', timeout=10)
# Print the response body as decoded by requests.
print(res.text)
# Parse the HTML using the lxml parser backend.
soup = BeautifulSoup(res.text, 'lxml')
# Connect to the MySQL database `qc` on localhost and create a cursor.
# NOTE(review): credentials are hard-coded here; consider loading them from
# configuration or environment variables.
conn = pymysql.Connect(host='127.0.0.1', user='root', password="123", database='qc', port=3306)
# NOTE: the name `cursour` (sic) is kept as-is, since code beyond this
# section may refer to it.
cursour = conn.cursor()
# Collect every <ul> element whose class is "article".
ul_list = soup.find_all(name='ul', class_='article')
for ul in ul_list:
li_list=ul.find_all('li')
for li in li_list:
h3=li.find('h3')
if h3:
title=h3.text
desc=li.find