# 程序很简单,运行一下就知道了。
import requests
import re
# Base of the search URL; the search keyword is appended to this path.
web_url = 'https://www.yunpanjingling.com/search/'

# HTTP headers sent with each request (an iPhone Safari User-Agent string).
headers = {
    'User-Agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 9_1 like Mac OS X) AppleWebKit/601.1.46 (KHTML, like Gecko) Version/9.0 Mobile/13B143 Safari/601.1',
}

# Interactive parameters: what to search for and how many result pages to
# walk. `page` stays a string here; it is converted with int() where used.
keyword = input('请输入搜索关键词:')
page = input('请输入要检索的总页数:')
# Patterns are compiled once and written as raw strings: the earlier non-raw
# literal contained "\/", an invalid string escape that newer Python versions
# warn about. The text matched is the same as before.
_LINK_RE = re.compile(r'<a href="(.*?)" target')
_NAME_RE = re.compile(r'rel="nofollow"> (.*?) </a>')


def parse_page(response):
    """Pull result links and result titles out of a results-page HTML string.

    Args:
        response: HTML text to scan.

    Returns:
        A ``(links, names)`` tuple of two lists of strings:
        ``links`` holds every ``href`` value of an ``<a href="..." target``
        tag, and ``names`` holds the text found between ``rel="nofollow"> ``
        and `` </a>``. Names are returned verbatim, including any inline
        markup such as ``<em>``. The two lists are collected independently
        and are not guaranteed to have the same length.
    """
    comment = _LINK_RE.findall(response)
    namee = _NAME_RE.findall(response)
    return comment, namee
#
# Walk result pages 1..page, printing each result title followed by its link.
from urllib.parse import quote  # imported here so this script section is self-contained

# Convert the page count once; non-numeric input raises ValueError before
# any request is made.
total_pages = int(page)

# Percent-encode the keyword so characters such as '?', '#', '%' or spaces
# stay part of the URL path instead of being read as a query or fragment.
search_url = web_url + quote(keyword)

for pagee in range(1, total_pages + 1):
    print('---------------第'+str(pagee)+'页---------------------')
    url = search_url + '?page=' + str(pagee)
    # The timeout stops an unresponsive server from hanging the script forever.
    response = requests.get(url=url, headers=headers, timeout=10).text
    comment, namee = parse_page(response)
    # zip() stops at the shorter list, so a name without a matching link
    # (or the reverse) is silently dropped.
    for x, y in zip(namee, comment):
        print('\n')
        # Remove <em> tags embedded in the title text
        # (presumably keyword highlighting - TODO confirm).
        print(x.replace('<em>', '').replace('</em>', ''))
        print(y)
# 运行截图: