使用Selenium和python进行爬取

时间:2018-07-31 11:08:10

标签: python selenium web-scraping

Numbers are in chart 我正在尝试获取14401之类的数字。我尝试过

WebDriverWait(driver, 10).until(EC.frame_to_be_available_and_switch_to_it((By.XPATH,"//iframe[@id='wiz-iframe-intent']")))
WebDriverWait(driver, 10).until(EC.element_to_be_clickable((By.XPATH, '//*[@id="highcharts-5tawcvw-0"]/svg/g[8]/g[1]/text/tspan[1]'))).text

获取超时异常。

1 个答案:

答案 0 :(得分:1)

该特定元素位于 SVG中。,您可以遵循以下代码:

from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC 
from selenium.webdriver.common.action_chains import ActionChains
from selenium.webdriver.support.select import Select
import time

driver = webdriver.Chrome(executable_path = r'D:/Automation/chromedriver.exe')
driver.maximize_window()
driver.get("https://eu1.dashboard.clevertap.com/login.html")

wait = WebDriverWait(driver, 20)
action = ActionChains(driver)
wait.until(EC.frame_to_be_available_and_switch_to_it((By.ID,"wiz-iframe-intent")))
wait.until(EC.element_to_be_clickable((By.XPATH, "//div[@class='CT_Interstitial']//span[@class='CT_InterstitialClose']"))).click()

driver.switch_to.default_content()

wait.until(EC.element_to_be_clickable((By.NAME, "email"))).send_keys("username")

wait.until(EC.element_to_be_clickable((By.NAME,"password"))).send_keys("****")  

wait.until(EC.element_to_be_clickable((By.ID,"submitBtn"))).click()

wait.until(EC.visibility_of_element_located((By.CSS_SELECTOR, 'div.ct-breadcrumb')))

try:
    wait.until(EC.frame_to_be_available_and_switch_to_it((By.ID,"wiz-iframe-intent")))
    wait.until(EC.element_to_be_clickable((By.CSS_SELECTOR, "div.close-btn.js-close-popup>button"))).click()
except:
    pass

driver.switch_to.default_content()  
action.move_to_element(driver.find_element_by_css_selector("div.sidebar__brand+ul>li:first-child>a")).perform()

wait.until(EC.visibility_of_element_located((By.LINK_TEXT, "All Boards")))  

wait.until(EC.element_to_be_clickable((By.LINK_TEXT,"All Boards"))).click()

wait.until(EC.element_to_be_clickable((By.LINK_TEXT,"pe-funnel"))).click()

wait.until(EC.visibility_of_element_located((By.XPATH, "//*[name()='tspan' and contains(@stroke-linejoin,'round')]"))) 

all_data = driver.find_elements_by_xpath("//*[name()='tspan' and contains(@stroke-linejoin,'round')]")

print(len(all_data))

for data in all_data:
 print(data.text)