2016-11-23 74 views
0

我试图从https://www.bcbsga.com/health-insurance/provider-directory/searchcriteria中检索医生姓名,他们的地址和其他字段。我在下面附上我的代码。我不确定在最后的'for'循环中有什么问题,我得到了下面的输出,而不是网站上的数据。Python Selenium Webdriver - 从网站检索连续数据

selenium.webdriver.remote.webelement.WebElement (会话= “ba8c85ad6e398939063d5b43ee513668”,元素= “0.6436841330730552-19”)> selenium.webdriver.remote.webelement.WebElement(会话= “ba8c85ad6e398939063d5b43ee513668”,元素=” 0.6436841330730552-20“)>

import time 
from selenium import webdriver 
from selenium.webdriver.common.keys import Keys 

divID = 'ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireInsurance_chosen' 
inputID = 'ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireInsurance_chosen_input' 
inputValue = 'I buy it myself (or plan to buy it myself)' 

driver = webdriver.Chrome() 

driver.get("https://www.bcbsga.com/health-insurance/provider-directory/searchcriteria") 
driver.find_element_by_id("btnGuestContinue").click() 
driver.implicitly_wait(10) 

driver.find_element_by_id('ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireInsurance_chosen').click() 
driver.find_element_by_id('ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireInsurance_chosen_input').send_keys('I buy it myself (or plan to buy it myself)') 
driver.find_element_by_id('ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireInsurance_chosen_input').send_keys(Keys.RETURN) 

driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireWhobought_chosen").click() 
driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireWhobought_chosen_input").send_keys("Marketplace/exchanges") 
driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireWhobought_chosen_input").send_keys(Keys.RETURN) 

driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireState_chosen").click() 
driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireState_chosen_input").send_keys("Georgia") 
driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlQuestionnaireState_chosen_input").send_keys(Keys.RETURN) 

driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlCareTypes_chosen").click() 
driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlCareTypes_chosen_input").send_keys("Medical") 
driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlCareTypes_chosen_input").send_keys(Keys.RETURN) 

driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlquestionnairePlanNetworks_chosen").click() 
driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlquestionnairePlanNetworks_chosen_input").send_keys("All plans/networks selection") 
driver.find_element_by_id("ctl00_MainContent_maincontent_PFPlanQuestionnaire_ddlquestionnairePlanNetworks_chosen_input").send_keys(Keys.RETURN) 

driver.find_element_by_id("btnGuestQuestionnaireContinue").click() 

#'located near' field 
driver.find_element_by_id("ctl00_MainContent_maincontent_pfSearchMain_pfLocationSearch_txtZipCityState").send_keys("30303") 

#within a distance of 
driver.find_element_by_id("ctl00_MainContent_maincontent_pfSearchMain_pfLocationSearch_ddlRadius_chosen").click() 
driver.find_element_by_id("ctl00_MainContent_maincontent_pfSearchMain_pfLocationSearch_ddlRadius_chosen_input").send_keys("10 miles") 
driver.find_element_by_id("ctl00_MainContent_maincontent_pfSearchMain_pfLocationSearch_ddlRadius_chosen_input").send_keys(Keys.RETURN) 
#speciality 
driver.find_element_by_id("ctl00_MainContent_maincontent_pfSearchMain_ddlSpeciality_chosen").click() 
driver.find_element_by_id("ctl00_MainContent_maincontent_pfSearchMain_ddlSpeciality_chosen_input").send_keys("Cardiology") 
driver.find_element_by_id("ctl00_MainContent_maincontent_pfSearchMain_ddlSpeciality_chosen_input").send_keys(Keys.RETURN) 
#click the search button 
driver.find_element_by_id("btnSearch").click() 
time.sleep(10) 

for i in range(10): 
     name = driver.find_element_by_id("ctl00_ResultsList_ctrl" + str(i) + "_lnkName") 
     address = driver.find_element_by_id("ctl00_ResultsList_ctrl" + str(i) + "_lblAddress") 
     print(name, address) 

driver.close() 

回答

1

的问题是,find_element_by_id应返回的网络元素,而不是文本节点,所以很明显nameaddress是网页元素。您应该使用

for i in range(10): 
    name = driver.find_element_by_id("ctl00_ResultsList_ctrl" + str(i) + "_lnkName").text 
    address = driver.find_element_by_id("ctl00_ResultsList_ctrl" + str(i) + "_lblAddress").text 
    print(name, address) 
1

我想我在最后的'for'循环中省略了.text字段。添加它们会检索元素的名称!

for i in range(10): 
     name = driver.find_element_by_id("ctl00_ResultsList_ctrl" + str(i) + "_lnkName").text 
     address = driver.find_element_by_id("ctl00_ResultsList_ctrl" + str(i) + "_lblAddress").text 
     print(name, address) 
+0

也许你应该检查你的脚本的最后两行... – gus27

+0

是的,我懂了工作,犯了一个错误,而编辑在这里。谢谢! – Srikanth