2021-10-10
2021-10-10 本文已影响0人
月夜星空下
# Imports: sleep from the standard library, plus webdriver and its helpers from selenium
from time import sleep
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.chrome.options import Options
from selenium.webdriver.support import expected_conditions as EC
# Fetch the SSE supervision-measures page with headless Chrome and print its
# rendered HTML source.

# Run Chrome without a visible window.
chrome_options = Options()
chrome_options.add_argument("--headless")
chrome_options.add_argument("--disable-gpu")

# At this point Selenium launches the chromedriver program found at the given
# path. (webdriver.Firefox() would be the Firefox equivalent.)
# NOTE(review): `executable_path` is deprecated in Selenium 4 in favour of a
# Service object - revisit this call when upgrading Selenium.
browser = webdriver.Chrome(executable_path=r'D:\tools\chromedriver.exe', options=chrome_options)
try:
    # get() opens the given URL.
    # Alternative page tried earlier:
    # http://www.sse.com.cn/disclosure/credibility/members/disposition/
    browser.get('http://www.sse.com.cn/disclosure/credibility/supervision/measures/')

    # page_source is the HTML of the page as currently loaded in the browser.
    pageSource = browser.page_source
    print(pageSource)

    # Any further element lookups on `browser` must happen inside this try
    # block, before the session is closed below.
finally:
    # Always end the session, even if loading the page failed; otherwise the
    # headless Chrome and chromedriver processes keep running after the
    # script exits.
    browser.quit()
# table = browser.find_element_by_xpath('/html/body/div[8]/div[2]/div[2]/div[2]/div/div/div/div/div[2]/div[1]/div/table')
# print(table)
# table_list = [] # 存放table数据
# for tr in table.find_elements_by_tag_name('tr'): # 遍历每一个tr
# print(tr.text)
# print(tr.get_attribute('href'))
# 将每一个tr的数据根据td查询出来,返回结果为list对象
# table_td_list = tr.find_elements(By.TAG_NAME, "td")
# row_list = []
# # print(table_td_list)
# for td in table_td_list: # 遍历每一个td
# print(td.get_attribute('title'))
# row_list.append(td.text) # 取出表格的数据,并放入行列表里
# table_list.append(row_list)
# print(row_list)
# print(row_list)
# tr = table.find_elements_by_tag_name('tr')
# print(tr)
# for i in tr:
# table_td_list = tr.find_elements(By.TAG_NAME, "td")
# # td = i.find_elements_by_tag_name('td')
# # for j in td:
# # print(j.text)
# print('-' * 100)
# for i in table:
# print(i)
# tr = i.find_elements_by_tag_name('tbody')
# print(tr)
# x = table_ele.find_elements_by_tag_name('tr')
# print(x)
# rows = table_ele.find_elements_by_tag_name("tr")
# print(rows)
# rows = table_ele.find_elements_by_tag_name("tr") # 定位table下的tr标签
# td_content = element.find_elements_by_tag_name("table")
# print(td_content)
# for i in element[0]:
# print(i)
# def next_page(page):
# try:
# next = wait.until(EC.element_to_be_clickable((By.CSS_SELECTOR, '.classPage') and (By.CSS_SELECTOR, "[page='{}']".format(page))))
# next.click()
# sleep(2)
# get_products()
# return True
# except:
# return False