如何使用 Selenium 打开网页,并下载该网页的所有静态资源文件(JS、CSS、图片等)?
网友回复
附上示例代码:
import socket
import select
import threading
import requests
import os
from urllib.parse import urlparse, urljoin
# Address (IP and port) the proxy server listens on.
host, port = "127.0.0.1", 8081
# Value handed to listen() below as the pending-connection backlog.
max_connections = 100
# Buffer size; its consumers are outside this part of the file.
buffer_size = 4096

# Create the IPv4/TCP listening socket for the proxy. SO_REUSEADDR is enabled
# before bind() so the address can be rebound right after a restart.
proxy_server = socket.socket(family=socket.AF_INET, type=socket.SOCK_STREAM)
proxy_server.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
proxy_server.bind((host, port))
proxy_server.listen(max_connections)
print(f"代理服务器已启动,监听地址:{host}:{port}")
def download_file(url, folder,headers):
# 获取网页URL的路径和文件名
parsed_url = urlparse(url)
path_parts = parsed_url.path.split("/")
if path_parts[-1] == "":
filename = "index.html"
else:
filename = path_parts[-1]
# 获取本地文件路径
local_path = os.path.join(folder, *path_parts[1:-1])
if not os.path.exists(local_path):
os...点击查看剩余70%


