Python爬虫爬取古诗词内容,并存入MySQL
爬取结果展示:
代码如下:
from urllib import request
import re,os
import pymysql
import time
# Root of the so.gushiwen.org site (same host that get_model_url's link pattern matches).
base_url = 'https://so.gushiwen.org'
# Page at www.gushiwen.org/shiwen/; presumably the crawl's starting page — confirm against the caller.
shiwen_url = "https://www.gushiwen.org/shiwen/"
def get_model_url(shiwen_url):
    """Collect the so.gushiwen.org ``.aspx`` links found on a page.

    Args:
        shiwen_url: URL of the page to scan; it is handed to ``get_html``.

    Returns:
        A list of ``(path, text)`` tuples, one per matching anchor.
        ``path`` is the part of the href between
        ``https://so.gushiwen.org/`` and ``.aspx``; ``text`` is the
        anchor's inner text.
    """
    # NOTE(review): get_html is defined outside this block; presumably it
    # returns the page markup as str — confirm.
    html = get_html(shiwen_url)
    # Raw string: "\." in a plain literal is an invalid escape sequence and
    # triggers a warning on current Python versions. The pattern value is
    # unchanged.
    link_pattern = r'<a href="https://so\.gushiwen\.org/(.*?)\.aspx">(.*?)</a>'
    return re.compile(link_pattern).findall(html)
def conn_mysql():
    """Open a PyMySQL connection to the ``test`` database.

    Returns:
        The connection object returned by ``pymysql.connect``. It is
        returned open; nothing in this function closes it.
    """
    # NOTE(review): host and credentials are hard-coded in source. Consider
    # loading them from configuration or the environment instead.
    host = '49.4.71.22'
    username = 'admin'
    password = 'admin963'
    dbname = 'test'
    # Keyword arguments are required: PyMySQL 1.0+ made connect()'s
    # parameters keyword-only, so the positional form raises TypeError.
    return pymysql.connect(
        host=host,
        user=username,
        password=password,
        database=dbname,
    )
def createtable_poem():
sql='create table if not exists poem(model_name varchar(50),poem_name varchar(50),' \
'author_name varchar(50),dynasty var