在网页数据面打开检查,利用精确定位标签对应网页源代码的位置,在点击network ,可以通过改按钮获取浏览器信息、cookie信息,并且找到数据接口




import requests
response = requests.get('https://game.gtimg.cn/images/lol/act/img/js/heroList/hero_list.js')
result = response.json()
for x in result['hero']:
print(x['name'])
from selenium.webdriver import Chrome
b = Chrome()
b.get('https://movie.douban.com/top250')
print(b.page_source)
b.close()
b = Chrome()
b.get('https://www.jd.com')
input_tag = b.find_element_by_id('key')
input_tag.send_keys('电脑\n')
print(b.page_source)
btn = b.find_element_by_css_selector('#navitems-group2 .b')
btn.click()
from selenium.webdriver import Chrome
from time import sleep
from bs4 import BeautifulSoup
import csv
import lxml
f = open('files/手机数据.csv', 'w', encoding='utf-8')
writer = csv.writer(f)
writer.writerow(['商品','价格'])
def analysis_data(html: str):
soup = BeautifulSoup(html,'lxml')
all_iphone = soup.select('#J_goodsList>ul>li>div.gl-i-wrap')
# print(all_iphone)
phone = []
for iphone in all_iphone:
name = iphone.select_one('.p-name em').text
price = iphone.select_one('.p-price i').text
phone.append([name, price])
writer.writerows(phone)
return phone
b = Chrome()
# 1.输入框输入内容
b.get('https://www.jd.com')
# a.找到输入框标签
input_tag = b.find_element_by_id('key')
# b.在输入框输入内容
input_tag.send_keys('手机\n')
sleep(2)
# c.第一页获取手机页面数据
result = b.page_source
analysis_data(result)
sleep(2)
# # 2.点击按钮
# # 点击第二页
btn = b.find_element_by_css_selector('#J_bottomPage>span>.pn-next')
btn.click()
# 获取第二页手机页面数据
sleep(2)
result1 = b.page_source
analysis_data(result1)
f.close()
input('是否结束:')
b.close()
from selenium.webdriver import Chrome
from time import sleep
from bs4 import BeautifulSoup
# 1. 基本操作
b = Chrome() # 创建浏览器
b.get('https://www.cnki.net/') # 打开中国*网
search_tag = b.find_element_by_id('txt_SearchText') # 获取输入框
search_tag.send_keys('数据分析\n') # 输入框输入'数据分析',然后按回车
sleep(1) # 切换界面最后做一个等待操作
# 获取需要点击的所有标签: 如果拿到标签后需要点击或者输入,必须通过浏览器获取标签
all_result = b.find_elements_by_css_selector('.result-table-list .name>a')
# 点击第一个结果(这儿会打开一个新的选项卡)
all_result[0].click()
sleep(1)
# 跳转到窗口(获取所有窗口)
b.switch_to.window(b.window_handles[-1])
soup = BeautifulSoup(b.page_source, 'lxml')
result = soup.select_one('#ChDivSummary').text
print(result)
b.close() # 关闭当前指向的窗口(最后一个窗口),窗口关闭后,浏览器对象的指向不会发生改变
# 回到第一个窗口,点击下一个搜索结果
b.switch_to.window(b.window_handles[0])
all_result[1].click()
sleep(1)
b.switch_to.window(b.window_handles[-1])
soup = BeautifulSoup(b.page_source, 'lxml')
result = soup.select_one('#ChDivSummary').text
print(result)
b.close()
input('结束:')
b.close()