程式人生 > Python的網路爬蟲小系統——爬取京東商城商品資訊

Python的網路爬蟲小系統——爬取京東商城商品資訊

import time

from selenium import webdriver
from selenium.webdriver.common.by import By
# Search jd.com for a user-supplied keyword and dump the visible text of every
# product tile on the first five result pages into "<keyword>.txt".
keyword = input('請輸入你要搜尋的關鍵字:')
page_count = 5

brow = webdriver.Firefox()
try:
    brow.get('http://www.jd.com')

    # Type the keyword into the search box (id="key") and submit the search.
    search_form = brow.find_element(By.ID, 'key')
    search_form.send_keys(keyword)
    search_button = brow.find_element(By.CLASS_NAME, 'button')
    search_button.click()
    time.sleep(2)

    # The context manager guarantees the file is flushed and closed even if
    # the browser raises part-way through the crawl.
    with open('%s.txt' % keyword, mode='w', encoding='utf-8') as file_handle:
        for page in range(1, page_count + 1):
            print('正在爬取第%s頁資料,請稍等' % page)

            # Scroll to 10%, 30%, 50%, 70% and 90% of the document height,
            # pausing one second before each step.
            # NOTE(review): presumably this gives lazily loaded product tiles
            # time to render -- confirm against the live page.
            for step in range(1, 11, 2):
                time.sleep(1)
                fraction = step / 10
                js = 'document.documentElement.scrollTop = document.documentElement.scrollHeight * %f' % fraction
                brow.execute_script(js)

            # Each element with class "gl-item" is written as-is; records are
            # emitted back-to-back with no extra separator.
            shops = brow.find_elements(By.CLASS_NAME, 'gl-item')
            for shop in shops:
                file_handle.write(shop.text)

            # Only advance when another page will actually be scraped.
            if page < page_count:
                next_li = brow.find_element(By.CLASS_NAME, 'pn-next')
                next_li.click()
finally:
    # Always shut the browser down so a failed run does not leak a Firefox
    # process.
    brow.quit()