05_python
2020-12-13 04:19
标签:int cli arch end sel cto port pre 链接 利用selenium去爬取京东商品信息 05_python 标签:int cli arch end sel cto port pre 链接 原文地址:https://www.cnblogs.com/RenJian666/p/11107952.html
from selenium import webdriver
from selenium.webdriver.common.keys import Keys
import time
from selenium.webdriver.common.by import By

# Open JD.com, search for "手机" (mobile phones), walk through the result
# pages and append every listed product to a text file.
#
# For each product the URL, name, price and review count are printed and
# written to "jd_手机商品信息.txt". Any exception is printed rather than
# re-raised, and the browser session is always shut down at the end.
browser = webdriver.Chrome()
try:
    # Implicit wait: element lookups retry for up to 10 s before failing.
    browser.implicitly_wait(10)
    browser.get("http://www.jd.com")

    # Type the keyword into the search box and submit it with ENTER.
    input_search = browser.find_element(By.ID, "key")
    input_search.send_keys("手机")
    input_search.send_keys(Keys.ENTER)
    time.sleep(3)

    # The number shown in the pager is used as the count of pages to scrape.
    # NOTE(review): assumes ".p-skip em b" holds the total page count.
    num = int(browser.find_element(By.CSS_SELECTOR, ".p-skip em b").text)
    print(num)

    # Open the output file once (append mode) instead of once per product.
    with open("jd_手机商品信息.txt", "a", encoding="utf-8") as f:
        for page in range(num):
            # Look the items up again on every page: a list fetched before
            # navigating belongs to the previous page.
            good_list = browser.find_elements(By.CLASS_NAME, "gl-item")
            for good in good_list:
                # Product URL
                good_url = good.find_element(
                    By.CSS_SELECTOR, ".p-img a"
                ).get_attribute("href")
                print(good_url)
                # Product name
                good_name = good.find_element(By.CSS_SELECTOR, "a em").text
                print(good_name)
                # Product price
                good_price = good.find_element(
                    By.CSS_SELECTOR, ".p-price strong"
                ).text
                print(good_price)
                # Number of reviews
                good_commit = good.find_element(
                    By.CSS_SELECTOR, ".p-commit strong"
                ).text
                print(good_commit)
                # Record written to the file; the literal is kept flush-left
                # so no indentation leaks into the output.
                good_info = f'''
商品名称:{good_name}
商品链接:{good_url}
商品价格:{good_price}
商品评价: {good_commit}
\n
'''
                f.write(good_info)

            # Go to the next page, except after the last one where there is
            # nothing further to load.
            if page < num - 1:
                browser.find_element(By.CLASS_NAME, "pn-next").click()
                time.sleep(3)
except Exception as e:
    # Best-effort script: report the failure and fall through to cleanup.
    print(e)
finally:
    time.sleep(10)
    # quit() ends the whole driver session; close() would only close the
    # current window.
    browser.quit()
上一篇:算法整理-并查集和分治
下一篇:统计两个数组中相同元素的个数