Python 基于百度图片搜索的图片爬虫

最新推荐文章于 2023-09-20 14:27:59 发布

原创最新推荐文章于 2023-09-20 14:27:59 发布 · 799 阅读

1 ·

CC 4.0 BY-SA版权

文章标签：

#python #爬虫

爬虫篇专栏收录该内容

6 篇文章

订阅专栏

本文给出一个基于百度图片搜索的 Python 爬虫示例：根据用户输入的关键词请求百度图片搜索页面，用正则表达式从返回的页面中提取 "objURL" 字段里的图片地址，再逐一下载并保存到本地目录。

#! /usr/bin/python
# -*- coding: utf-8 -*-
# Author: chen
# Date 06/12
import  requests
import  re  #导入正则表达式  提取所需要的内容
import  random
def spiderPic(html, keyword, save_dir='D:\\Python\\image\\'):
    """Download every image referenced by an ``"objURL"`` entry in *html*.

    Args:
        html: Page text to scan; image addresses are taken from its
            ``"objURL":"..."`` fields.
        keyword: Search keyword, used only in the progress message.
        save_dir: Directory the images are written to. Defaults to the
            location the script originally hard-coded; it is created on
            demand the first time an image is about to be saved.

    Each image is stored as ``<n>.jpg`` using the next positive integer whose
    file name is not already taken, so one download never overwrites another
    (the previous random naming had only 250 possible names).

    Addresses that cannot be fetched (connection failure, timeout, HTTP error
    status, malformed URL) are reported and skipped.
    """
    import os  # function-scope import keeps this block self-contained

    print('正在查找：'+keyword+'对应的文件，正在从百度中查找！！！')
    index = 0
    for addr in re.findall(r'"objURL":"(.*?)"', html, re.S):
        print('现在正在爬取URL中的地址：'+str(addr)[0:30]+'...')
        try:
            pic = requests.get(addr, timeout=10)
            # Treat 4xx/5xx answers as failures instead of saving the error
            # page under a .jpg name.
            pic.raise_for_status()
        except requests.exceptions.RequestException:
            # RequestException is the base class of ConnectionError, Timeout,
            # HTTPError and the invalid-URL errors, so one bad address can no
            # longer abort the whole run.
            print('您当前的URL出现错误！')
            continue

        os.makedirs(save_dir, exist_ok=True)
        # Advance to the first unused file name so neither this run nor an
        # earlier one gets overwritten.
        while True:
            index += 1
            target = os.path.join(save_dir, str(index) + '.jpg')
            if not os.path.exists(target):
                break
        with open(target, 'wb') as fn:
            fn.write(pic.content)



if __name__ == '__main__':
    # Script entry point: ask for a keyword, fetch the Baidu image-search
    # result page for it, and hand the page text to spiderPic.
    print('python')
    word = input('请输入您想要爬取的关键词：')
    # The keyword goes through ``params`` so requests percent-encodes it;
    # concatenating it into the URL broke on characters such as '&' or '#'.
    # The timeout keeps the script from hanging forever on a stalled server.
    resource = requests.get(
        'http://image.baidu.com/search/index?tn=baiduimage&ps=1&ct=201326592&lm=-1&cl=2&nc=1&ie=utf-8',
        params={'word': word},
        timeout=10,
    )
    # Call the downloader. This must stay inside the guard: at module level
    # it ran on import as well, where ``resource`` and ``word`` do not exist.
    spiderPic(resource.text, word)