1.导入基本的urllib库,以及re、os、time库.
import urllib.request
import urllib.parse
import re
import os
import time
2.设置url和headers.
# Album page whose images will be downloaded.
image_url = 'http://www.youmei8.com/meizitu/1859.html'
# Request headers; the User-Agent string mimics a desktop Chrome browser.
# Adjacent string literals are concatenated by the parser into one value.
headers = {
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/70.0.3538.110 Safari/537.36'
    ),
}
3.获取网页.
# Fetch the album page; afterwards `response` holds the decoded HTML text.
request = urllib.request.Request(url=image_url, headers=headers)
# The context manager closes the connection even if reading or decoding
# fails, and the timeout keeps a stalled server from hanging the script.
with urllib.request.urlopen(request, timeout=30) as page:
    # Use the charset declared in the Content-Type header when there is one;
    # otherwise fall back to UTF-8, which is what a bare .decode() uses.
    charset = page.headers.get_content_charset() or 'utf-8'
    response = page.read().decode(charset)
4.正则匹配当前网页所有图片链接.
# Collect the src value of every <img alt="" src="..."> tag in the page.
# The pattern starts at the literal '<img' instead of a leading '.*?': with
# re.S a leading '.*?' makes each failed search start rescan the rest of the
# page (quadratic time after the last image) without changing what is
# captured. '[^>]*>' consumes the remainder of the tag up to its first '>'.
pattern = re.compile(r'<img alt="" src="(.*?)"[^>]*>', re.S)
lt = pattern.findall(response)
5.用for循环下载所有图片,同时创建文件夹、为图片命名并打印提示信息.
# Download every matched image into one album folder.
# The folder name is bound before the loop so the final message still works
# when no image matched (it used to be assigned only inside the loop, which
# raised NameError on an empty match list).
dirname = '白色蕾丝装'
if lt:
    # Create the folder once instead of re-checking on every iteration.
    os.makedirs(dirname, exist_ok=True)
for img in lt:
    # The last path segment of the URL becomes the local file name.
    imgname = img.split('/')[-1]
    img_name = os.path.join(dirname, imgname)
    # The captured src may be relative or protocol-relative; resolve it
    # against the page URL. Absolute URLs pass through unchanged.
    img_url = urllib.parse.urljoin(image_url, img)
    print('%s图片正在下载...' % imgname)
    urllib.request.urlretrieve(img_url, img_name)
    print('%s图片下载完成...' % imgname)
    # One-second pause between downloads (presumably to go easy on the server).
    time.sleep(1)
print('%s专辑下载完成' % dirname)
dirname为文件夹名,image_url为http://www.youmei8.com/的专辑链接.