首页 > 其他 > 详细

Selenium 滚动条应用:爬取《永远讲不完的故事》

时间:2019-03-25 23:00:56      阅读:156      评论:0      收藏:0      [点我收藏+]
from selenium import webdriver
from selenium.common.exceptions import NoSuchElementException
from selenium.webdriver.common.by import By


class Lj:
    """Scrape pages of a book on 99lib.net into a local text file.

    Creating an instance opens a Chrome session on the hard-coded start
    page. Each call to run() appends the page currently displayed to the
    output file and then clicks through to the following page.
    """

    def __init__(self):
        """Start Chrome, load the start page and configure the session."""
        self.driver = webdriver.Chrome()
        url = 'http://www.99lib.net/book/1222/34747.htm'
        self.driver.get(url)
        self.driver.maximize_window()
        # Element lookups poll for up to 10 seconds before giving up.
        self.driver.implicitly_wait(10)

    def get_title(self) -> str:
        """Return the text of the <h2> heading inside the #content element."""
        heading = self.driver.find_element(By.XPATH, '//*[@id="content"]/h2')
        return heading.text

    def get_content(self) -> str:
        """Return the full visible text of the #content element."""
        body = self.driver.find_element(By.XPATH, '//*[@id="content"]')
        return body.text

    def file(self, data: str) -> None:
        """Append *data* followed by a newline to the UTF-8 output file."""
        with open('永远讲不完的故事.txt', 'a', encoding='utf-8') as f:
            f.write(data + '\n')

    def gun(self) -> None:
        """Scroll the page down by setting scrollTop to a very large value."""
        js = "var q=document.documentElement.scrollTop=100000"
        self.driver.execute_script(js)

    def next(self) -> None:
        """Click the link whose text is '下一页' (next page)."""
        self.driver.find_element(By.LINK_TEXT, '下一页').click()

    def run(self, max_scrolls=None) -> bool:
        """Save the current page, then move the browser to the next one.

        The title is printed first. The page is then scrolled down until
        the '下一页' (next page) link can be located; once it is, the title
        and the content text are appended to the output file and the link
        is clicked.

        Args:
            max_scrolls: Upper bound on the number of scroll attempts made
                while waiting for the next-page link. ``None`` (the
                default) keeps scrolling until the link is found.

        Returns:
            True when the page was saved and the next-page link clicked.
            False when ``max_scrolls`` scrolls were made without the link
            being found; nothing is written in that case.
        """
        title = self.get_title()
        print(title)
        scrolls = 0
        while True:
            try:
                self.driver.find_element(By.LINK_TEXT, '下一页')
            except NoSuchElementException:
                # Only a missing link triggers a scroll-and-retry; any other
                # error (including Ctrl+C) propagates to the caller.
                if max_scrolls is not None and scrolls >= max_scrolls:
                    return False
                self.gun()
                scrolls += 1
                continue
            # Read the text before clicking: the click replaces the page.
            content = self.get_content()
            self.file(title)
            self.file(content)
            self.next()
            return True


# Open the browser and keep saving pages; each run() call handles one page.
a = Lj()
try:
    while True:
        a.run()
finally:
    # Close the browser session however the loop ends (Ctrl+C, an error).
    a.driver.quit()


Selenium 滚动条应用:爬取《永远讲不完的故事》

原文:https://www.cnblogs.com/sleep10000years/p/10597232.html

(0)
(0)
   
举报
评论 一句话评论(0)
关于我们 - 联系我们 - 留言反馈 - 联系我们:wmxa8@hotmail.com
© 2014 bubuko.com 版权所有
打开技术之扣,分享程序人生!