# Specify the URL of the images on Douban.
import os
from urllib.parse import urljoin

import requests
from lxml import etree
# Download every image listed on a Douban movie photo gallery, following the
# "next" pagination link until there is none, and save the images as
# picters/1.jpg, picters/2.jpg, ... in the order they are encountered.

# First gallery page to scrape.
url = "https://movie.douban.com/subject/34867871/photos?type=W"
headers = {"User-Agent": "mozilla/4.0 (compatible; MSIE 5.5; Windows NT)"}
# Seconds to wait for any single HTTP request; without a timeout a stalled
# connection would block the script forever.
timeout = 30
out_dir = "picters"
# The original script assumed the directory already existed and crashed on
# the first write otherwise.
os.makedirs(out_dir, exist_ok=True)

a = 1  # running counter used as the output file name
while url:
    page = requests.get(url=url, headers=headers, timeout=timeout).text
    tree = etree.HTML(page)
    for i in tree.xpath('//div[@class="article"]//li'):
        src = i.xpath('.//img/@src')
        if not src:
            # Not every <li> under the article div necessarily holds an
            # image; skip those instead of raising IndexError.
            continue
        name = f"{out_dir}/{a}.jpg"
        # urljoin leaves absolute URLs untouched and resolves relative ones
        # against the page they were found on.
        path = urljoin(url, src[0])
        data = requests.get(url=path, headers=headers, timeout=timeout).content
        with open(name, "wb") as f:
            f.write(data)
        a += 1
        print(name, "yes!!!")
    # An empty result means this was the last page, which ends the loop.
    next_href = tree.xpath('//span[@class="next"]/a/@href')
    url = urljoin(url, next_href[0]) if next_href else None