# coding: utf-8
"""Print the viewer count and room name of every listing in Douyu's "all" directory.

The script drives a PhantomJS browser through the paginated directory at
https://www.douyu.com/directory/all, parses each rendered page with
BeautifulSoup and prints one line per room. It stops once the page source
contains the "shark-pager-disable-next" marker.
"""
from selenium import webdriver
from bs4 import BeautifulSoup as bs

driver = webdriver.PhantomJS()
try:
    driver.get("https://www.douyu.com/directory/all")

    while True:
        # Parse the page as currently rendered by the browser.
        soup = bs(driver.page_source, "lxml")

        # Room titles are read from <h3 class="ellipsis"> and viewer counts
        # from <span class="dy-num fr">.
        names = soup.find_all("h3", {"class": "ellipsis"})
        numbers = soup.find_all("span", {"class": "dy-num fr"})

        # zip() pairs the two lists by position and stops at the shorter one.
        # NOTE(review): assumes both lists come back in matching order with
        # one entry per room -- confirm against the live markup.
        for name, number in zip(names, numbers):
            # A parenthesised single argument prints the same text whether
            # print is the Python 2 statement or the Python 3 function.
            print(u"观众人数: -" + number.get_text().strip() + u"-\t房间名: " + name.get_text().strip())

        # Presumably this class marks the "next" pager button as disabled on
        # the last page; once it shows up in the source, stop paging.
        if "shark-pager-disable-next" in driver.page_source:
            break

        # Advance to the next page of the directory.
        # NOTE(review): there is no explicit wait after the click, so the next
        # iteration reads whatever the browser has rendered by then.
        driver.find_element_by_class_name("shark-pager-next").click()
finally:
    # Always shut the browser down, even when navigation, parsing or the
    # click raises; otherwise the PhantomJS process is left running.
    driver.quit()
斗鱼抓取
最新推荐文章于 2024-12-17 17:20:34 发布