2021-10-10

2021-10-10  本文已影响0人  月夜星空下
# 从selenium里面导入webdriver
from time import sleep
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.chrome.options import Options
from selenium.webdriver.support import expected_conditions as EC

# Configure Chrome to run headless (no visible window) with the GPU disabled.
chrome_options = Options()
chrome_options.add_argument("--headless")
chrome_options.add_argument("--disable-gpu")

# At this point Selenium starts the chromedriver executable at the given path.
# driver = webdriver.Chrome()
# driver = webdriver.Firefox()  # Firefox equivalent of the line above
browser = webdriver.Chrome(executable_path=r'D:\tools\chromedriver.exe', options=chrome_options)
try:
    # Open the target URL.
    browser.get('http://www.sse.com.cn/disclosure/credibility/supervision/measures/')
    # browser.get('http://www.sse.com.cn/disclosure/credibility/members/disposition/')

    # table = browser.find_element_by_xpath('//*[@id="panel-1"]/div[1]/div/table')
    # print(table)
    # # print(table)
    # for i in table:
    #     print(i)

    # Dump the HTML of the loaded page to stdout.
    pageSource = browser.page_source
    print(pageSource)
finally:
    # Always shut down the browser and its chromedriver process, even when the
    # page load fails; otherwise each run leaves a headless Chrome behind.
    # NOTE: any of the commented-out experiments below that use `browser`
    # must be moved inside the `try` block if they are re-enabled.
    browser.quit()

# table = browser.find_element_by_xpath('/html/body/div[8]/div[2]/div[2]/div[2]/div/div/div/div/div[2]/div[1]/div/table')
# print(table)

# table_list = []  # 存放table数据
# for tr in table.find_elements_by_tag_name('tr'):  # 遍历每一个tr
#     print(tr.text)
#     print(tr.get_attribute('href'))
    # 将每一个tr的数据根据td查询出来,返回结果为list对象
    # table_td_list = tr.find_elements(By.TAG_NAME, "td")
    # row_list = []
    # # print(table_td_list)
    # for td in table_td_list:  # 遍历每一个td
    #     print(td.get_attribute('title'))
    #     row_list.append(td.text)  # 取出表格的数据,并放入行列表里
    # table_list.append(row_list)
    # print(row_list)
    # print(row_list)

# tr = table.find_elements_by_tag_name('tr')
# print(tr)
# for i in tr:
#     table_td_list = tr.find_elements(By.TAG_NAME, "td")
#     #     td = i.find_elements_by_tag_name('td')
#     #     for j in td:
#     #         print(j.text)
#     print('-' * 100)
# for i in table:
#     print(i)
#     tr = i.find_elements_by_tag_name('tbody')
#     print(tr)


# x = table_ele.find_elements_by_tag_name('tr')
# print(x)

# rows = table_ele.find_elements_by_tag_name("tr")
# print(rows)
# rows = table_ele.find_elements_by_tag_name("tr")  # 定位table下的tr标签
# td_content = element.find_elements_by_tag_name("table")
# print(td_content)

# for i in element[0]:
#     print(i)


# def next_page(page):
#     try:
#         next = wait.until(EC.element_to_be_clickable((By.CSS_SELECTOR, '.classPage') and (By.CSS_SELECTOR, "[page='{}']".format(page))))
#         next.click()
#         sleep(2)
#         get_products()
#         return True
#     except:
#         return False

上一篇 下一篇

猜你喜欢

热点阅读