import requests
import re
import os
from urllib.request import urlretrieve
def _safe_filename(title):
    """Return ``title`` with characters that are unsafe in file names replaced by ``_``."""
    # Path separators would redirect the download into another directory, and
    # the remaining characters are rejected by Windows file systems.
    return re.sub(r'[\\/:*?"<>|]', '_', title).strip()


def download_vedio(save_dir='vedio', timeout=30):
    """Download every video linked from the Pear Video ``category_8`` listing page.

    The listing page is fetched once, each linked detail page is fetched in
    turn, and the video file referenced on the detail page is saved as
    ``<save_dir>/<title>.mp4``.

    Args:
        save_dir: Directory the ``.mp4`` files are written to. It is created
            if it does not exist. Defaults to ``'vedio'`` (the original
            hard-coded location).
        timeout: Seconds to wait for each HTML page request before giving up.

    Raises:
        requests.RequestException: If fetching the listing page or a detail
            page fails or times out.
        OSError: If the output directory or a video file cannot be written
            (``urllib.error.URLError`` from the download is a subclass).
    """
    base_url = 'https://www.pearvideo.com/'

    # Compile the patterns once instead of rebuilding them for every page.
    link_re = re.compile(r'<a href="(.*?)" class="vervideo-lilink actplay">')
    src_re = re.compile(r'srcUrl="(.*?)",vdoUrl=srcUrl')
    title_re = re.compile(r'<h1 class="video-tt">(.*?)</h1>')

    listing_html = requests.get(base_url + 'category_8', timeout=timeout).text
    play_urls = [base_url + href for href in link_re.findall(listing_html)]
    if not play_urls:
        # Nothing to download; do not leave an empty directory behind.
        return

    # exist_ok avoids the check-then-create race of listing the directory first.
    os.makedirs(save_dir, exist_ok=True)

    for play_url in play_urls:
        page_html = requests.get(play_url, timeout=timeout).text
        src_match = src_re.search(page_html)
        title_match = title_re.search(page_html)
        if src_match is None or title_match is None:
            # The page layout did not match; skip this video rather than
            # aborting the remaining downloads with an IndexError.
            print('跳过(未找到视频地址或标题):%s' % play_url)
            continue

        title = title_match.group(1)
        print('正在下载视频:%s' % title)
        filepath = os.path.join(save_dir, '%s.mp4' % _safe_filename(title))
        urlretrieve(src_match.group(1), filepath)
# Module-level entry point: the download starts as soon as this file is
# executed (and also if it is imported, since there is no __main__ guard).
download_vedio()