Python的網路爬蟲小系統——爬取京東商城商品資訊
阿新 • • 發佈:2019-02-04
"""Scrape JD.com search results for a keyword and dump them to a text file.

The script asks for a search keyword, drives Firefox through Selenium to
search www.jd.com, walks through the first result pages and writes the visible
text of every element with class ``gl-item`` to ``<keyword>.txt``.
"""
import time

from selenium import webdriver
from selenium.webdriver.common.by import By

# Number of result pages to walk through.
PAGE_COUNT = 5

keyword = input('請輸入你要搜尋的關鍵字:')

brow = webdriver.Firefox()
try:
    brow.get('http://www.jd.com')

    # Type the keyword into the search box and submit the search.
    search_form = brow.find_element(By.ID, 'key')
    search_form.send_keys(keyword)
    search_button = brow.find_element(By.CLASS_NAME, 'button')
    search_button.click()
    time.sleep(2)  # crude wait for the result page to load

    # The context manager guarantees the file is flushed and closed even if
    # scraping fails half-way through.
    with open('%s.txt' % keyword, mode='w', encoding='utf-8') as file_handle:
        for page in range(1, PAGE_COUNT + 1):
            print('正在爬取第%s頁資料,請稍等' % page)

            # Scroll down in steps (10%, 30%, ..., 90% of the page height),
            # pausing one second before each step.
            # NOTE(review): presumably this lets lazily loaded items render
            # before they are collected -- confirm against the live page.
            for step in range(1, 11, 2):
                time.sleep(1)
                fraction = step / 10
                js = 'document.documentElement.scrollTop = document.documentElement.scrollHeight * %f' % fraction
                brow.execute_script(js)

            shops = brow.find_elements(By.CLASS_NAME, 'gl-item')
            for shop in shops:
                # Terminate every record with a newline so the last line of
                # one item does not run into the first line of the next.
                file_handle.write(shop.text + '\n')

            # Only advance when another page is still going to be scraped;
            # clicking "next" after the final page is wasted navigation.
            if page < PAGE_COUNT:
                brow.find_element(By.CLASS_NAME, 'pn-next').click()
finally:
    # Always shut the browser down, even when an element lookup fails.
    brow.quit()