notion / src /ProxyPool.js
clash-linux's picture
Upload 17 files
8c0c410 verified
import axios from 'axios';
/**
* 代理池类,用于管理和提供HTTP代理
*/
class ProxyPool {
/**
* 创建代理池实例
* @param {Object} options - 配置选项
* @param {number} options.targetCount - 目标代理数量,默认20
* @param {number} options.batchSize - 每次获取的代理数量,默认20
* @param {number} options.testTimeout - 测试代理超时时间(毫秒),默认5000
* @param {number} options.requestTimeout - 请求目标网站超时时间(毫秒),默认10000
* @param {string} options.targetUrl - 目标网站URL,默认'https://www.notion.so'
* @param {number} options.concurrentRequests - 并发请求数量,默认10
* @param {number} options.minThreshold - 可用代理数量低于此阈值时自动补充,默认5
* @param {number} options.checkInterval - 检查代理池状态的时间间隔(毫秒),默认30000
* @param {string} options.proxyProtocol - 代理协议,默认'http'
* @param {number} options.maxRefillAttempts - 最大补充尝试次数,默认20
* @param {number} options.retryDelay - 重试延迟(毫秒),默认1000
* @param {boolean} options.useCache - 是否使用缓存,默认true
* @param {number} options.cacheExpiry - 缓存过期时间(毫秒),默认3600000 (1小时)
*/
constructor(options = {}) {
// 配置参数
this.targetCount = options.targetCount || 20;
this.batchSize = options.batchSize || 20;
this.testTimeout = options.testTimeout || 5000;
this.requestTimeout = options.requestTimeout || 10000;
this.targetUrl = options.targetUrl || 'https://www.notion.so';
this.concurrentRequests = options.concurrentRequests || 10;
this.minThreshold = options.minThreshold || 5;
this.checkInterval = options.checkInterval || 30000; // 默认30秒检查一次
this.proxyProtocol = options.proxyProtocol || 'http';
this.maxRefillAttempts = options.maxRefillAttempts || 20; // 减少最大尝试次数
this.retryDelay = options.retryDelay || 1000; // 减少重试延迟
this.useCache = options.useCache !== undefined ? options.useCache : true;
this.cacheExpiry = options.cacheExpiry || 3600000; // 默认1小时
// 内部状态
this.availableProxies = [];
this.currentIndex = 0;
this.isInitialized = false;
this.isRefilling = false;
this.checkTimer = null;
this.proxyCache = new Map(); // 缓存验证过的代理
// 绑定方法
this.getProxy = this.getProxy.bind(this);
this.removeProxy = this.removeProxy.bind(this);
this.checkAndRefill = this.checkAndRefill.bind(this);
}
/**
* 初始化代理池
* @returns {Promise<void>}
*/
async initialize() {
if (this.isInitialized) return;
console.log(`初始化代理池,目标数量: ${this.targetCount}`);
await this.refillProxies();
// 设置定时检查
this.checkTimer = setInterval(this.checkAndRefill, this.checkInterval);
this.isInitialized = true;
console.log(`代理池初始化完成,当前可用代理数量: ${this.availableProxies.length}`);
}
/**
* 停止代理池服务
*/
stop() {
if (this.checkTimer) {
clearInterval(this.checkTimer);
this.checkTimer = null;
}
console.log('代理池服务已停止');
}
/**
* 检查并补充代理
*/
async checkAndRefill() {
if (this.availableProxies.length <= this.minThreshold && !this.isRefilling) {
console.log(`可用代理数量(${this.availableProxies.length})低于阈值(${this.minThreshold}),开始补充代理`);
await this.refillProxies();
}
}
/**
* 补充代理到目标数量
* @returns {Promise<void>}
*/
async refillProxies() {
if (this.isRefilling) return;
this.isRefilling = true;
console.log(`开始补充代理,当前数量: ${this.availableProxies.length},目标数量: ${this.targetCount}`);
let attempts = 0;
try {
// 计算需要补充的代理数量
const neededProxies = this.targetCount - this.availableProxies.length;
// 优先检查缓存中的代理
if (this.useCache && this.proxyCache.size > 0) {
await this.tryUsingCachedProxies(neededProxies);
}
// 如果缓存中的代理不足,继续获取新代理
while (this.availableProxies.length < this.targetCount && attempts < this.maxRefillAttempts) {
attempts++;
console.log(`补充尝试 #${attempts},当前可用代理: ${this.availableProxies.length}/${this.targetCount}`);
// 计算本次需要获取的批次大小
const remainingNeeded = this.targetCount - this.availableProxies.length;
const batchSizeNeeded = Math.max(this.batchSize, remainingNeeded * 2); // 获取更多代理以提高成功率
// 获取代理
const proxies = await this.getProxiesFromProvider(batchSizeNeeded);
if (proxies.length === 0) {
console.log(`没有获取到代理,等待${this.retryDelay/1000}秒后重试...`);
await new Promise(resolve => setTimeout(resolve, this.retryDelay));
continue;
}
// 过滤掉已有的代理
const newProxies = this.filterExistingProxies(proxies);
if (newProxies.length === 0) {
console.log('所有获取的代理都已存在,继续获取新代理...');
continue;
}
// 测试代理
const results = await this.testProxiesConcurrently(newProxies);
// 添加可用代理
this.addValidProxies(results);
// 如果已经获取到足够的代理,提前结束
if (this.availableProxies.length >= this.targetCount) {
break;
}
// 如果还没补充到足够的代理,等待一段时间再继续
if (this.availableProxies.length < this.targetCount) {
await new Promise(resolve => setTimeout(resolve, this.retryDelay));
}
}
} catch (error) {
console.error('补充代理过程中出错:', error);
} finally {
this.isRefilling = false;
if (this.availableProxies.length >= this.targetCount) {
console.log(`代理补充完成,当前可用代理: ${this.availableProxies.length}/${this.targetCount}`);
} else {
console.log(`已达到最大尝试次数 ${this.maxRefillAttempts},当前可用代理: ${this.availableProxies.length}/${this.targetCount}`);
}
}
}
/**
* 尝试使用缓存中的代理
* @param {number} neededProxies - 需要的代理数量
*/
async tryUsingCachedProxies(neededProxies) {
const now = Date.now();
const cachedProxies = [];
// 筛选未过期的缓存代理
for (const [proxyKey, data] of this.proxyCache.entries()) {
if (now - data.timestamp < this.cacheExpiry && data.valid) {
cachedProxies.push(proxyKey);
if (cachedProxies.length >= neededProxies) {
break;
}
}
}
if (cachedProxies.length > 0) {
console.log(`从缓存中找到 ${cachedProxies.length} 个可能可用的代理`);
// 验证缓存的代理是否仍然可用
const results = await this.testProxiesConcurrently(cachedProxies);
this.addValidProxies(results);
}
}
/**
* 过滤掉已存在的代理
* @param {Array<string>} proxies - 代理列表
* @returns {Array<string>} - 新代理列表
*/
filterExistingProxies(proxies) {
return proxies.filter(proxy => {
const [ip, port] = proxy.split(':');
return !this.availableProxies.some(p => p.ip === ip && p.port === port);
});
}
/**
* 添加有效的代理到代理池
* @param {Array<{proxy: string, result: boolean}>} results - 测试结果
*/
addValidProxies(results) {
for (const { proxy, result } of results) {
if (result) {
const [ip, port] = proxy.split(':');
// 检查是否已存在
if (!this.availableProxies.some(p => p.ip === ip && p.port === port)) {
const proxyObj = {
ip,
port,
protocol: this.proxyProtocol,
full: `${this.proxyProtocol}://${proxy}`,
addedAt: new Date().toISOString()
};
this.availableProxies.push(proxyObj);
// 添加到缓存
if (this.useCache) {
this.proxyCache.set(proxy, {
valid: true,
timestamp: Date.now()
});
}
console.log(`成功添加代理: ${proxyObj.full},当前可用代理: ${this.availableProxies.length}/${this.targetCount}`);
if (this.availableProxies.length >= this.targetCount) {
break;
}
}
} else if (this.useCache) {
// 记录无效代理到缓存
this.proxyCache.set(proxy, {
valid: false,
timestamp: Date.now()
});
}
}
}
/**
* 从代理服务获取代理URL
* @param {number} count - 请求的代理数量
* @returns {Promise<Array<string>>} - 代理URL列表
*/
async getProxiesFromProvider(count = null) {
try {
console.log(`使用自定义代理服务器`);
// 直接返回配置的代理
return ['34.55.224.190:8080'];
} catch (error) {
console.error('获取代理出错:', error.message);
return [];
}
}
/**
* 并发测试多个代理
* @param {Array<string>} proxies - 代理列表
* @returns {Promise<Array<{proxy: string, result: boolean}>>} - 测试结果
*/
async testProxiesConcurrently(proxies) {
const results = [];
const remainingNeeded = this.targetCount - this.availableProxies.length;
// 增加并发数以加快处理速度
const concurrentRequests = Math.min(this.concurrentRequests * 2, 20);
// 分批处理代理
for (let i = 0; i < proxies.length; i += concurrentRequests) {
const batch = proxies.slice(i, i + concurrentRequests);
const promises = batch.map(proxy => {
// 检查缓存中是否有近期验证过的结果
if (this.useCache && this.proxyCache.has(proxy)) {
const cachedResult = this.proxyCache.get(proxy);
const isFresh = (Date.now() - cachedResult.timestamp) < this.cacheExpiry;
if (isFresh) {
// 使用缓存结果,避免重复测试
return Promise.resolve({ proxy, result: cachedResult.valid });
}
}
return this.testProxy(proxy)
.then(result => ({ proxy, result }))
.catch(() => ({ proxy, result: false }));
});
const batchResults = await Promise.all(promises);
results.push(...batchResults);
// 如果已经找到足够的代理,提前结束测试
const successCount = results.filter(item => item.result).length;
if (successCount >= remainingNeeded) {
break;
}
}
return results;
}
/**
* 测试代理是否可用
* @param {string} proxyUrl - 代理URL
* @returns {Promise<boolean>} - 代理是否可用
*/
async testProxy(proxyUrl) {
try {
// 创建代理配置
const proxyConfig = {
host: proxyUrl.split(':')[0],
port: parseInt(proxyUrl.split(':')[1]),
protocol: this.proxyProtocol
};
// 发送请求到目标网站
const response = await axios.get(this.targetUrl, {
proxy: proxyConfig,
headers: {
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36',
'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
'Accept-Language': 'en-US,en;q=0.5',
'Connection': 'keep-alive',
'Upgrade-Insecure-Requests': '1'
},
timeout: this.requestTimeout,
validateStatus: status => true,
maxRedirects: 10,
followRedirect: true
});
// 检查响应是否包含目标网站特有的内容
const isTargetContent = response.data &&
(typeof response.data === 'string') &&
(response.data.includes('notion') ||
response.data.includes('Notion'));
const isValid = response.status === 200 && isTargetContent;
if (isValid) {
console.log(`代理 ${proxyUrl} 请求目标网站成功,状态码: ${response.status}`);
} else {
console.log(`代理 ${proxyUrl} 请求目标网站失败,状态码: ${response.status}`);
}
return isValid;
} catch (error) {
console.log(`代理 ${proxyUrl} 请求出错: ${error.message}`);
return false;
}
}
/**
* 获取一个可用代理
* @returns {Object|null} - 代理对象,如果没有可用代理则返回null
*/
getProxy() {
if (this.availableProxies.length === 0) {
console.log('没有可用代理');
return null;
}
// 轮询方式获取代理
const proxy = this.availableProxies[this.currentIndex];
this.currentIndex = (this.currentIndex + 1) % this.availableProxies.length;
return proxy;
}
/**
* 移除指定代理
* @param {string} ip - 代理IP
* @param {string|number} port - 代理端口
* @returns {boolean} - 是否成功移除
*/
removeProxy(ip, port) {
const portStr = port.toString();
const initialLength = this.availableProxies.length;
// 找到要移除的代理
const proxyToRemove = this.availableProxies.find(
proxy => proxy.ip === ip && proxy.port === portStr
);
if (proxyToRemove) {
// 更新缓存,标记为无效
if (this.useCache) {
const proxyKey = `${ip}:${portStr}`;
this.proxyCache.set(proxyKey, { valid: false, timestamp: Date.now() });
}
}
this.availableProxies = this.availableProxies.filter(
proxy => !(proxy.ip === ip && proxy.port === portStr)
);
// 重置当前索引,确保不会越界
if (this.currentIndex >= this.availableProxies.length && this.availableProxies.length > 0) {
this.currentIndex = 0;
}
const removed = initialLength > this.availableProxies.length;
if (removed) {
console.log(`已移除代理 ${ip}:${port},当前可用代理: ${this.availableProxies.length}`);
} else {
console.log(`未找到要移除的代理 ${ip}:${port}`);
}
// 如果移除后代理数量低于阈值,触发补充
this.checkAndRefill();
return removed;
}
/**
* 获取所有可用代理
* @returns {Array<Object>} - 代理对象数组
*/
getAllProxies() {
return [...this.availableProxies];
}
/**
* 获取可用代理数量
* @returns {number} - 代理数量
*/
getCount() {
return this.availableProxies.length;
}
/**
* 清理过期的缓存条目
*/
cleanupCache() {
if (!this.useCache) return;
const now = Date.now();
let cleanupCount = 0;
for (const [key, data] of this.proxyCache.entries()) {
if (now - data.timestamp > this.cacheExpiry) {
this.proxyCache.delete(key);
cleanupCount++;
}
}
if (cleanupCount > 0) {
console.log(`清理了 ${cleanupCount} 个过期的缓存代理`);
}
}
}
// 使用示例
async function example() {
// 创建代理池实例
const proxyPool = new ProxyPool({
targetCount: 10, // 目标保持10个代理
minThreshold: 3, // 当可用代理少于3个时,自动补充
checkInterval: 60000, // 每60秒检查一次
targetUrl: 'https://www.notion.so',
concurrentRequests: 15, // 增加并发请求数
useCache: true, // 启用缓存
maxRefillAttempts: 15, // 减少最大尝试次数
retryDelay: 1000 // 减少重试延迟
});
// 初始化代理池
await proxyPool.initialize();
// 获取一个代理
const proxy = proxyPool.getProxy();
console.log('获取到代理:', proxy);
// 模拟使用一段时间后,移除一个代理
setTimeout(() => {
if (proxy) {
proxyPool.removeProxy(proxy.ip, proxy.port);
}
// 获取所有代理
const allProxies = proxyPool.getAllProxies();
console.log(`当前所有代理(${allProxies.length}):`, allProxies);
// 使用完毕后停止服务
setTimeout(() => {
proxyPool.stop();
console.log('代理池示例运行完毕');
}, 5000);
}, 5000);
}
// 如果直接运行此文件,则执行示例
if (typeof require !== 'undefined' && require.main === module) {
example().catch(err => console.error('示例运行出错:', err));
}
// 导出 ProxyPool 类和实例
export default ProxyPool;
export const proxyPool = new ProxyPool();