# The code is as follows:
import urllib.request
import re
for i in range(1,2):
url = "http://www.58pic.com/piccate/7-128-0-default-0_2_0_0_default_0-" + str(i) + ".html"
data = urllib.request.urlopen(url).read().decode("utf-8","ignore")
pat = '<a class="card-img video-play" target="_blank" href="(.*?)">'
imgUrlList = re.compile(pat).findall(data)
for j in range(0,len(imgUrlList)):
imgPageData = urllib.request.urlopen(imgUrlList[j]).read().decode("utf-8","ignore")
pat = 'src="(.*?)" class="show-area-pic"'
imgUrl = re.search(pat,imgPageData).group(1)
headers = { "Accept":"text/html,application/xhtml+xml,application/xml;",
"Accept-Encoding