selenium webdriver chrome 获取 文件 下载 链接 (js生成的链接,点击事件发送请求并弹窗的那种)

import json
from selenium import webdriver
from selenium.webdriver.chrome.options import Options
from selenium.webdriver.common.desired_capabilities import DesiredCapabilities

chrome_options = Options()

# 开启performance日志记录
caps = DesiredCapabilities.CHROME
caps['goog:loggingPrefs'] = {'performance': 'ALL'}
chrome_options.add_experimental_option('perfLoggingPrefs', {'enableNetwork': True})

DRIVER = webdriver.Chrome(executable_path="C:\python\chromedriver.exe", chrome_options=chrome_options,
                          desired_capabilities=caps)

# 放大,防止有的元素渲染完被覆盖点击不到
DRIVER.set_window_size(1920, 1080)

# 访问目标网站
DRIVER.get("https://xxxx.xxxx.com")

# 寻找元素id为xxxxx的元素并点击
DRIVER.find_element_by_id("xxxxx").click()

# js事件执行发送请求后浏览器弹窗下载,拿到日志记录
browser_log = DRIVER.get_log('performance')
browser_log.reverse()

for i in browser_log:
    if i.get('message'):
        message_dict = json.loads(i.get('message'))
        file_download_url = message_dict.get('message').get('params').get('url') if message_dict else None
        
print(file_download_url)

你可能感兴趣的:(爬虫)