一、获取ip代理代码:
# IP地址取自国内高匿代理IP网站:https://www.xicidaili.com/nn
# 爬取首页IP地址,分为HTTPS和HTTP两类
# 随机获取一个http的代理(注意:有可能选择到的这个ip代理不可用)
from bs4 import BeautifulSoup
import requests
import random
# Address of the proxy listing page.
url = 'https://www.xicidaili.com/nn'
# Request headers carrying a desktop-Chrome User-Agent string.
headers = {
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 6.1; Win64; x64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/53.0.2785.143 Safari/537.36'
    ),
}
def get_ip_list(url, headers):
try:
webdata = requests.get(url, headers=headers, timeout=10)
print(webdata.status_code)
soup = BeautifulSoup(webdata.text, 'html.parser')
ips = soup.find_all('tr')
# print(ips)
ips = ips[1:] # 因为第1个tr里面没有td
# for item in ips:
# print(item)
ip_httpslist1 = []
ip_httplist1 = []
for i in ra