一、Python BeautifulSoup解析HTML获取图片URL并下载到本地
import os
from urllib.parse import urljoin, urlparse

import bs4
import requests
# Fetch one article page, collect every <img> inside ``.entry-content`` and
# save each image into the local ``JDLY`` directory.
url = 'https://www.jdlingyu.com/145853.html'
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/137.0.0.0 Safari/537.36"
}
output_dir = 'JDLY'
# Seconds to wait for the server; without a timeout requests may block forever.
request_timeout = 30

os.makedirs(output_dir, exist_ok=True)
try:
    # ``headers`` has to be a keyword argument: the second positional
    # parameter of requests.get() is ``params``, so passing it positionally
    # would put the dict in the query string and send no custom User-Agent.
    main_request = requests.get(url, headers=headers, timeout=request_timeout)
    main_request.raise_for_status()
    soup = bs4.BeautifulSoup(main_request.text, 'html.parser')

    for index, img_tag in enumerate(soup.select('.entry-content img')):
        # The image address is read from ``data-src`` (presumably the page
        # lazy-loads its images -- verify against the site); fall back to the
        # plain ``src`` attribute and skip tags that carry neither.
        img_src = img_tag.get('data-src') or img_tag.get('src')
        if not img_src:
            continue

        # Resolve relative addresses against the page URL.
        img_url = urljoin(url, img_src)
        # Name the file after the URL *path* only, so a query string never
        # leaks into the file name; use a generated name if the path is empty.
        file_name = os.path.basename(urlparse(img_url).path) or f"image_{index}"

        # Handle failures per image so one bad download does not abort the
        # remaining ones.
        try:
            img_response = requests.get(
                img_url, headers=headers, timeout=request_timeout
            )
            # Do not write an HTTP error page to disk as if it were an image.
            img_response.raise_for_status()
            with open(os.path.join(output_dir, file_name), mode='wb') as f:
                f.write(img_response.content)
        except (requests.RequestException, OSError) as e:
            print(f"获取图片异常:{img_url} {e}")
except Exception as e:
    # Top-level boundary of the script: report the failure instead of
    # crashing with a traceback.
    print("获取图片异常:" + str(e))