from selenium import webdriver
from selenium.webdriver.chrome.options import Options
import time
# Build an options object so that Chrome is started in headless (no UI) mode.
chrome_options = Options()
chrome_options.add_argument('--headless')
chrome_options.add_argument('--disable-gpu')
# Path to the chromedriver executable.
path = r'./chromedriver.exe'
# Create the browser object.
# NOTE(review): `executable_path` / `chrome_options` are the Selenium 3 style
# keyword arguments -- confirm they match the installed Selenium version.
browser = webdriver.Chrome(executable_path=path, chrome_options=chrome_options)
try:
    # Open the page.
    url = 'http://www.baidu.com/'
    browser.get(url)
    # Fixed pause before taking the screenshot.
    time.sleep(3)
    browser.save_screenshot('baidu.png')
finally:
    # Always shut the browser down, even if loading or the screenshot fails,
    # so no Chrome/chromedriver process is left behind.
    browser.quit()
from selenium import webdriver
from lxml import etree
import time
from selenium.webdriver.chrome.options import Options
# Configure Chrome to run in headless (no UI) mode.
chrome_options = Options()
chrome_options.add_argument('--headless')
chrome_options.add_argument('--disable-gpu')
# NOTE(review): `executable_path` / `chrome_options` are the Selenium 3 style
# keyword arguments -- confirm they match the installed Selenium version.
bro = webdriver.Chrome(executable_path='./chromedriver.exe', chrome_options=chrome_options)
try:
    # Have the browser request the given URL.
    bro.get('http://125.35.6.84:81/xk/')
    # Pause BEFORE reading the page source; sleeping after the read (as the
    # original did) cannot affect the snapshot that was already taken.
    time.sleep(2)
    # Source of the page currently open in the browser
    # ("what you see is what you get").
    page_text = bro.page_source
    tree = etree.HTML(page_text)
    # Text of the link in the first <li> of the element with id "gzlist".
    # Raises IndexError if the XPath matches nothing.
    name = tree.xpath('//*[@id="gzlist"]/li[1]/dl/a/text()')[0]
    print(name)
    time.sleep(3)
finally:
    # Always shut the browser down, even if loading or parsing fails.
    bro.quit()
import requests
from selenium import webdriver
from lxml import etree
import time
# NOTE(review): `executable_path` and `find_element_by_id` are Selenium 3 style
# APIs -- confirm they match the installed Selenium version.
driver = webdriver.Chrome(executable_path='./chromedriver.exe')
try:
    driver.get('https://qzone.qq.com/')
    # Web applications often embed pages inside frames. WebDriver can only
    # locate elements in one page at a time, so elements inside a nested frame
    # cannot be located directly. Switch the current context into the frame
    # first (here via driver.switch_to.frame).
    driver.switch_to.frame('login_frame')
    driver.find_element_by_id('switcher_plogin').click()
    # driver.find_element_by_id('u').clear()
    driver.find_element_by_id('u').send_keys('328410948')  # put your QQ number here
    # driver.find_element_by_id('p').clear()
    driver.find_element_by_id('p').send_keys('xxxxxx')  # put your QQ password here
    driver.find_element_by_id('login_button').click()
    time.sleep(2)
    # Disabled follow-up: scroll to the bottom of the page three times, then
    # parse the page source and print the text of each feed entry.
    # driver.execute_script('window.scrollTo(0,document.body.scrollHeight)')
    # time.sleep(2)
    # driver.execute_script('window.scrollTo(0,document.body.scrollHeight)')
    # time.sleep(2)
    # driver.execute_script('window.scrollTo(0,document.body.scrollHeight)')
    # time.sleep(2)
    # page_text = driver.page_source
    #
    # tree = etree.HTML(page_text)
    # # Run the parsing step.
    # li_list = tree.xpath('//ul[@id="feed_friend_list"]/li')
    # for li in li_list:
    #     text_list = li.xpath('.//div[@class="f-info"]//text()|.//div[@class="f-info qz_info_cut"]//text()')
    #     text = ''.join(text_list)
    #     print(text + '\n\n\n')
finally:
    # quit() ends the whole driver session (close() only closes the current
    # window), and running it in `finally` guarantees cleanup on errors too.
    driver.quit()