python从知网上下载验证码 保存到本地
#!/bin/python
#coding="utf-8"
import requests
from lxml import etree
import os
import time
# Directory the downloaded captcha images are written into.
picPath = 'D:\\py\\murphy\\tesseract\\pic'

# Registration page whose markup contains the captcha <img> element.
URL = 'http://my.cnki.net/elibregister/commonRegister.aspx#'

# Request headers sent with the page request; carries a desktop Chrome
# User-Agent string.
headers = {
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 6.1; Win64; x64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/73.0.3683.103 Safari/537.36'
    ),
}
def download_img(num, timeout=10):
    """Download one captcha image and save it as ``<picPath>/<num>.png``.

    The page at ``URL`` is fetched first. The ``src`` attribute of the element
    whose id is ``checkcode`` is appended to the site's base path, and the
    resulting image is downloaded and written to disk in binary mode.

    The download is skipped silently (nothing is written, nothing is raised)
    when either response is not HTTP 200 or when the page has no ``checkcode``
    element. Exceptions raised by ``requests`` itself (connection errors,
    timeouts) are not caught here.

    Args:
        num: Value used as the file name stem; converted with ``str``.
        timeout: Seconds passed as ``timeout`` to each ``requests.get`` call,
            so a stalled connection cannot block forever.
    """
    filename = os.path.join(picPath, str(num) + '.png')

    response = requests.get(URL, headers=headers, timeout=timeout)
    if response.status_code != 200:
        return

    html = etree.HTML(response.text)
    # Guard against a body that produced no tree at all before querying it.
    if html is None:
        return
    sources = html.xpath('//*[@id="checkcode"]/@src')
    # Without this check a page lacking the captcha element would raise a
    # bare IndexError and abort the whole download run.
    if not sources:
        return

    img_url = 'http://my.cnki.net/elibregister/' + sources[0]
    # Send the same headers as the page request and verify the status, so an
    # error page is never saved to disk under a .png name.
    html_img = requests.get(img_url, headers=headers, timeout=timeout)
    if html_img.status_code != 200:
        return

    # Create the target directory on first use instead of failing in open().
    if not os.path.isdir(picPath):
        os.makedirs(picPath)
    with open(filename, 'wb') as fd:
        fd.write(html_img.content)
def main(begin, end, delay=3):
    """Download captcha images numbered ``begin`` up to, but excluding, ``end``.

    ``download_img`` is called once for every integer in
    ``range(begin, end)``, with a pause between consecutive downloads.

    Args:
        begin: First image number (inclusive).
        end: Stop value (exclusive).
        delay: Seconds to sleep between two downloads. Defaults to 3.
    """
    for index in range(begin, end):
        # Pause only between downloads; sleeping after the final one would
        # just postpone the return.
        if index != begin:
            time.sleep(delay)
        download_img(index)
if __name__ == "__main__":
    # Run as a script: fetch images numbered 1 through 100.
    main(begin=1, end=101)