selenium无法迭代元素

时间:2016-10-11 06:08:57

标签: python selenium web-scraping

我试图翻译tripadvisor的用户评论 我的代码: -

1.]仅选择葡萄牙语评论(来自语言下拉列表),

2.]然后展开每条评论,

3.]然后将所有这些扩展的评论保存在列表中

4.]然后将它们翻译成英语&在屏幕上打印

from selenium import webdriver
from selenium.webdriver.common.by import By
import time
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
com_=[] # To save translated comments
expanded_comments=[] # To save expanded comments
driver = webdriver.Chrome("C:\Users\shalini\Downloads\chromedriver_win32\chromedriver.exe")
driver.maximize_window()

def expand_reviews(driver):
    # TRYING TO EXPAND REVIEWS (& CLOSE A POPUP)    
    try:
        driver.find_element_by_class_name("moreLink").click()
    except:
        print "err"
    try:
        driver.find_element_by_class_name("ui_close_x").click()
    except:
        print "err"
    try:
        driver.find_element_by_class_name("moreLink").click()
    except:
        print "err3"




def save_comments(driver):
    expand_reviews(driver)
    # SELECTING ALL EXPANDED COMMENTS
    expanded_com_elements=driver.find_elements_by_class_name("entry")
    time.sleep(3)
    for i in expanded_com_elements:
        expanded_comments.append(i.text)


    # SELECTING ALL GOOGLE-TRANSLATOR links
    gt= driver.find_elements(By.CSS_SELECTOR,".googleTranslation>.link")

    # NOW PRINTING TRANSLATED COMMENTS
    for i in gt:
        try:
            driver.execute_script("arguments[0].click()",i)
            #i.click().perform()
            com=driver.find_element_by_class_name("ui_overlay").text
            com_.append(com)
            time.sleep(5)
            driver.find_element_by_class_name("ui_close_x").click().perform()
            time.sleep(5)
        except Exception as e:
            pass
            #print e



for i in range(282):
    page=i*10
    url="https://www.tripadvisor.com/Airline_Review-d8729164-Reviews-Cheap-Flights-or"+str(page)+"-TAP-Portugal#REVIEWS"
    driver.get(url)
    wait = WebDriverWait(driver, 10)
    if i==0:
        # SELECTING PORTUGUESE COMMENTS ONLY # Run for one time then iterate over pages
        try:
            langselction = wait.until(EC.element_to_be_clickable((By.CSS_SELECTOR, "span.sprite-date_picker-triangle")))
            langselction.click()
            driver.find_element_by_xpath("//div[@class='languageList']//li[normalize-space(.)='Portuguese first']").click()
            time.sleep(5)
        except Exception as e:
            print e

    save_comments(driver)

===== ERROR =================

expanded_comments返回空列表。有些评论会被保存,有些评论会被删除。 正确保存第一页(扩展所有注释),但此后只保存第一条注释而不进行扩展。但是,所有页面的翻译评论都会在com _

中正确保存

1 个答案:

答案 0 :(得分:1)

我已经更改了您的代码,现在它正在运行。

from selenium import webdriver
from selenium.webdriver.common.by import By
import time
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC

driver = webdriver.Chrome("./chromedriver.exe")
driver.maximize_window()
url="https://www.tripadvisor.com/Airline_Review-d8729164-Reviews-Cheap-Flights-TAP-Portugal#REVIEWS"
driver.get(url)
wait = WebDriverWait(driver, 10)



# SELECTING PORTUGUESE COMMENTS ONLY
#show_lan = driver.find_element_by_xpath("//div[@class='languageList']/ul/li[contains(text(),'Portuguese first')]")

try:
    langselction = wait.until(EC.element_to_be_clickable((By.CSS_SELECTOR, "span.sprite-date_picker-triangle")))
    langselction.click()
    driver.find_element_by_xpath("//div[@class='languageList']//li[normalize-space(.)='Portuguese first']").click()
    time.sleep(5)
except Exception as e:
    print e


# TRYING TO EXPAND REVIEWS (& CLOSE A POPUP)    
try:
    driver.find_element_by_class_name("moreLink").click()
except:
    print "err"
try:
    driver.find_element_by_class_name("ui_close_x").click()
except:
    print "err"
try:
    driver.find_element_by_class_name("moreLink").click()
except:
    print "err3"

# SELECTING ALL EXPANDED COMMENTS
expanded_com_elements=driver.find_elements_by_class_name("entry")
expanded_comments=[]
time.sleep(3)
for i in expanded_com_elements:
    expanded_comments.append(i.text)

# SELECTING ALL GOOGLE-TRANSLATOR links
gt= driver.find_elements(By.CSS_SELECTOR,".googleTranslation>.link")

# NOW PRINTING TRANSLATED COMMENTS
for i in gt:
    try:
        driver.execute_script("arguments[0].click()",i)
        #i.click().perform()
        print driver.find_element_by_class_name("ui_overlay").text
        time.sleep(5)
        driver.find_element_by_class_name("ui_close_x").click().perform()
        time.sleep(5)
    except Exception as e:
        pass
        #print e