# coding=utf-8
import time

from selenium import webdriver
from selenium.webdriver.common.by import By
# Start Chrome, open the site and descend into its nested frames.
# The page is laid out as: top document -> frame "I1" -> frames "map" and
# "bible".  The frame elements are kept in module-level names so later code
# can switch between them.
dr = webdriver.Chrome()
dr.maximize_window()
dr.get("http://www.godcom.net/hhb/")
# Element lookups retry for up to 20 seconds before failing.
dr.implicitly_wait(20)

# find_element(By...) / switch_to.frame replace the find_element_by_* and
# switch_to_frame helpers, which no longer exist in Selenium 4.
fr_all = dr.find_element(By.NAME, "I1")
dr.switch_to.frame(fr_all)
fr_1 = dr.find_element(By.NAME, "map")
fr_2 = dr.find_element(By.NAME, "bible")

# Collect every link inside the "map" frame; the driver is left focused on
# that frame.
dr.switch_to.frame(fr_1)
a = dr.find_elements(By.XPATH, "//table/tbody//a")
def _write_verses(out):
    """Append the rows of the chapter currently displayed to *out*.

    Each output line is the text of a row's first cell, a space, and the
    text of its second cell.  Cells are paired positionally.
    """
    # Fixed pause so the frame can finish rendering after a chapter click.
    time.sleep(1)
    numbers = dr.find_elements(By.XPATH, "//p/table/tbody//td[1]")
    bodies = dr.find_elements(By.XPATH, "//p/table/tbody//td[2]")
    for number_cell, body_cell in zip(numbers, bodies):
        # Read the text once; every .text access is a round trip to the browser.
        number = number_cell.text
        # NOTE(review): compares against a single space exactly as before;
        # confirm that rows meant to be skipped really report that text.
        if number != " ":
            out.write(number + " " + body_cell.text + "\n")


def _scrape_current_book():
    """Write every chapter of the book shown in the current frame to a file.

    The file is ``E://<heading>.txt`` (opened in append mode), where
    ``<heading>`` is the text of the page's ``<h2>`` element.
    """
    juan_name = dr.find_element(By.XPATH, "//h2").text
    # NOTE(review): no encoding is given, so the platform default is used;
    # confirm it can represent the scraped text.
    # The context manager guarantees the file is closed even if scraping fails.
    with open("E://" + juan_name + ".txt", "a") as openfiles:
        openfiles.write(juan_name + "\n" * 2)
        chapters = dr.find_elements(By.XPATH, "//body/table/tbody/tr/td[2]/a")
        for ch in range(len(chapters) + 2):
            chapter_xpath = "//body/table/tbody/tr/td[2]/a[text()='%d']" % (ch)
            print(chapter_xpath)
            if ch == 1:
                # The first chapter is already on screen; nothing to click.
                _write_verses(openfiles)
            elif ch >= 2:
                dr.find_element(By.XPATH, chapter_xpath).click()
                _write_verses(openfiles)


def test(value):
    """Scrape the book whose link text equals *value*.

    Walks the module-level link list ``a`` (printing each link's text),
    clicks every link whose text equals *value*, switches to the ``fr_2``
    frame to save the book to disk, then switches back to the ``fr_1`` frame
    so the remaining links can still be inspected.

    Args:
        value: Link text of the book to scrape.
    """
    for link in a:
        name = link.text
        print(name)
        if name != value:
            continue
        link.click()
        time.sleep(1)
        # Frame switches are relative to the current context, so go back to
        # the top document before descending into the other frame.
        dr.switch_to.default_content()
        dr.switch_to.frame(fr_all)
        dr.switch_to.frame(fr_2)
        _scrape_current_book()
        dr.switch_to.default_content()
        dr.switch_to.frame(fr_all)
        dr.switch_to.frame(fr_1)
# Scrape every book listed (one name per line) in the catalogue file, then
# close the browser.  The try/finally ensures the browser is shut down even
# when scraping raises.
try:
    # Read the whole catalogue first so the file is not held open while the
    # scrape runs.
    with open("E://result/圣经目录.txt") as dujing:
        djlist = dujing.readlines()
    for i in djlist:
        juan = i.strip("\n")
        if not juan:
            # A blank line would otherwise match any link with empty text.
            continue
        test(juan)
    time.sleep(10)
finally:
    dr.quit()
爬取圣经demo
最新推荐文章于 2025-07-08 10:08:15 发布
717

被折叠的 条评论
为什么被折叠?



