《2018年8月24日》【连续325天】
标题:pyspider图片爬取实例尝试;
内容:
参考1:https://cuiqingcai.com/2652.html
模仿这个写了个代码:
def __init__(self):
    """Initialise the crawl range and the helper used by the handler.

    Stores the listing URL prefix (the page number is appended to it),
    the first and last page numbers to request, and a ``Deal`` instance.
    """
    # Listing URL without the trailing page number.
    self.base_url = 'https://bcy.net/huodong/176?&p='
    # First page to request and last page (inclusive) to request.
    self.page_num, self.total_num = 1, 20
    # Helper object; Deal is defined outside this snippet.
    self.deal = Deal()
@every(minutes=24 * 60)
def on_start(self):
    """Queue every listing page from ``page_num`` through ``total_num``.

    Each listing URL is built by appending the page number to
    ``base_url`` and is handed to ``index_page`` for parsing.
    """
    # Use a local counter instead of advancing self.page_num. Mutating
    # the attribute left it past total_num after the first call, so a
    # later scheduled call on the same handler instance queued nothing.
    for page in range(self.page_num, self.total_num + 1):
        url = self.base_url + str(page)
        print(url)
        self.crawl(url, callback=self.index_page, validate_cert=False)
@config(age=10 * 24 * 60 * 60)
def index_page(self, response):
    """Follow every element matched by ``.db.ovf`` on a listing page.

    The ``href`` of each matched element is queued with ``detail_page``
    as its callback.
    """
    matches = response.doc('.db.ovf')
    for link in matches.items():
        target = link.attr.href
        self.crawl(target, callback=self.detail_page, validate_cert=False)
@config(priority=2)
def detail_page(self, response):
    """Queue the image found on a detail page for download.

    Reads the ``src`` of the ``.content-img-wrap img`` selection and
    queues it with ``save_img`` as the callback.
    """
    images = response.doc('.content-img-wrap img')
    # NOTE(review): .attr.src presumably yields only the first matched
    # element's src (and None when nothing matches) -- confirm whether
    # every image on the page should be queued instead.
    src = images.attr.src
    self.crawl(src, callback=self.save_img, validate_cert=False)
结果没有抓到图片,可能是选择器(标签)找错了,明天再改一下;
参考2:https://blog.youkuaiyun.com/u013919836/article/details/68066715