1. 程式人生 > >爬取京東商城商品信息

爬取京東商城商品信息

final finall pan __name__ cit spi web 爬取 webdriver

from selenium import webdriver
from selenium.webdriver import ActionChains
from selenium.webdriver.common.by import By #按照什麽方式查找,By.ID,By.CSS_SELECTOR
from selenium.webdriver.common.keys import Keys #鍵盤按鍵操作
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.support.wait import
WebDriverWait #等待頁面加載某些元素 import time def get_goods(driver): try: goods=driver.find_elements_by_class_name(gl-item) for good in goods: detail_url=good.find_element_by_tag_name(a).get_attribute(href) p_name=good.find_element_by_css_selector(
.p-name em).text.replace(\n,‘‘) price=good.find_element_by_css_selector(.p-price i).text p_commit=good.find_element_by_css_selector(.p-commit a).text msg = ‘‘‘ 商品 : %s 鏈接 : %s 價錢 :%s 評論 :%s
‘‘‘ % (p_name,detail_url,price,p_commit) print(msg,end=\n\n) button=driver.find_element_by_partial_link_text(下一頁) button.click() time.sleep(1) get_goods(driver) except Exception: pass def spider(url,keyword): driver = webdriver.Chrome() driver.get(url) driver.implicitly_wait(3) # 使用隱式等待 try: input_tag=driver.find_element_by_id(key) input_tag.send_keys(keyword) input_tag.send_keys(Keys.ENTER) get_goods(driver) finally: driver.close() if __name__ == __main__: spider(https://www.jd.com/,keyword=iPhone8手機) 爬取京東商城商品信息

爬取京東商城商品信息