# Download one page of image search results from image.so.com.
#
# NOTE: when trying to fetch a large number of images the server answers
# "403 Forbidden"; fetching 20 images per run works without problems.
import os
import urllib.request

# JSON endpoint for one page of search results (query and paging parameters
# are part of the URL itself).
url = (
    "https://image.so.com/j?q=%E9%A9%AC%E8%87%AA%E8%BE%BE&pd=1&pn=19"
    "&correct=%E9%A9%AC%E8%87%AA%E8%BE%BE&adstar=0&tab=all"
    "&sid=6ab4e6d3289b0d0be6bb0e4219031698&ras=6&cn=0&gn=0&kn=50&crn=0"
    "&bxn=20&cuben=0&pornn=0&manun=41&src=srp&sn=1&ps=1&pc=1"
)

# Headers sent with the search request: a browser User-Agent and the Referer
# of the matching search page.
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:23.0) Gecko/20100101 Firefox/23.0",
    "Referer": "https://image.so.com/i?q=%E9%A9%AC%E8%87%AA%E8%BE%BE&src=srp",
}

# Directory prefix the images are written to (kept with its trailing slash
# because file names are appended to it directly).
download_dir = "d:/download/"

# Seconds to wait for the search request before giving up.
request_timeout = 30


def fetch_result_page(page_url, request_headers, timeout=request_timeout):
    """Fetch *page_url* and return its decoded JSON body.

    Args:
        page_url: URL of the JSON search-result page.
        request_headers: HTTP headers to send with the request.
        timeout: Seconds to wait for the server before aborting.

    Returns:
        The parsed JSON document.

    Raises:
        requests.HTTPError: If the server answers with an error status
            (for example the 403 mentioned at the top of this script).
    """
    # Third-party dependency; imported here so the pure helpers below stay
    # usable even where ``requests`` is not installed.
    import requests

    response = requests.get(page_url, headers=request_headers, timeout=timeout)
    # Fail loudly on 4xx/5xx instead of trying to parse an error page as JSON.
    response.raise_for_status()
    return response.json()


def extract_image_urls(payload):
    """Return the ``img`` URL of every entry under ``payload['list']``.

    A missing or empty ``list`` yields an empty result, and entries without
    an ``img`` value are skipped.
    """
    entries = payload.get("list") or []
    return [entry["img"] for entry in entries if entry.get("img")]


def download_images(image_urls, directory=download_dir):
    """Save each URL in *image_urls* as ``<directory><index>.jpg``.

    Files are numbered from 0 in the order the URLs are given.

    Args:
        image_urls: Iterable of image URLs to download.
        directory: Target directory prefix, including the trailing slash.

    Returns:
        The number of images downloaded.
    """
    # Make sure the target directory exists before the first write.
    os.makedirs(directory, exist_ok=True)
    count = 0
    for index, image_url in enumerate(image_urls):
        urllib.request.urlretrieve(image_url, directory + str(index) + '.jpg')
        count = index + 1
    return count


def main():
    """Fetch the configured result page and download every listed image."""
    payload = fetch_result_page(url, headers)
    download_images(extract_image_urls(payload))


if __name__ == "__main__":
    main()
10-24
2079

12-21