Spaces:

stnh70
/

vid

Sleeping

App Files Files Community

stnh70 committed on Aug 20, 2025

Commit

3938f5e

verified ·

1 Parent(s): 67172ad

Update server.js

Browse files

Files changed (1) hide show

server.js +176 -2

server.js CHANGED Viewed

@@ -49,7 +49,7 @@ async function extractFirstIframeSrc(page, domain) {
     }
 }
-async function getVideoAndSubtitles(finalUrl) {
     try {
         const response = await fetch(finalUrl);
         if (!response.ok) {
@@ -92,10 +92,70 @@ async function getVideoAndSubtitles(finalUrl) {
     }
 }
 // 修改 scrapeProvider 函数
 // 在 scrapeProvider 函数中添加调试代码
-async function scrapeProvider(domain, url, signal) {
     if (signal.aborted) throw new Error('Aborted');
     console.log(`\n[${domain}] Starting scrape for URL: ${url}`);
@@ -179,6 +239,120 @@ async function scrapeProvider(domain, url, signal) {
     }
 }
 // 修改 handleSpecificTurnstile 函数
 async function handleSpecificTurnstile(page, domain) {
     try {

     }
 }
+async function getVideoAndSubtitles_(finalUrl) {
     try {
         const response = await fetch(finalUrl);
         if (!response.ok) {
     }
 }
/**
 * Fetches a player page/endpoint and extracts its HLS playlist URL plus subtitle tracks.
 *
 * URLs containing `cloudnestra.com/rcp/` are read as JSON (`file` / `subtitles`); when the
 * body is not JSON, or carries no `file`, it is scanned for a bare `.m3u8` link instead.
 * Any other URL is treated as a page embedding a player config of the form
 * `file: "….m3u8"` with an optional single-entry `tracks: [ {…} ]` list.
 *
 * @param {string} url - Address of the page or endpoint to inspect.
 * @returns {Promise<{videoFileUrl: string, subtitleSources: Array}>} The playlist URL and
 *     the subtitle entries that could be parsed (empty array when none).
 * @throws {Error} When the HTTP request fails or no playlist URL can be located.
 */
async function getVideoAndSubtitles(url) {
    console.log(`[getVideoAndSubtitles] Processing URL: ${url}`);
    const isCloudnestra = url.includes('cloudnestra.com/rcp/');

    try {
        const response = await fetch(url);
        // An error page must not be mistaken for a player page.
        if (!response.ok) {
            throw new Error(`Request to ${url} failed with HTTP status ${response.status}`);
        }
        const body = await response.text();

        if (isCloudnestra) {
            let payload = null;
            try {
                payload = JSON.parse(body);
            } catch (parseError) {
                // Not JSON: fall through to the plain-text .m3u8 scan below.
            }
            if (payload && payload.file) {
                console.log(`[getVideoAndSubtitles] Found video URL in cloudnestra response:`, payload.file);
                return {
                    videoFileUrl: payload.file,
                    subtitleSources: payload.subtitles || []
                };
            }

            const m3u8Match = body.match(/https?:\/\/[^\s"']+\.m3u8[^\s"']*/);
            if (m3u8Match) {
                console.log(`[getVideoAndSubtitles] Found m3u8 URL in cloudnestra response:`, m3u8Match[0]);
                return {
                    videoFileUrl: m3u8Match[0],
                    subtitleSources: []
                };
            }
            throw new Error("No video URL found in cloudnestra response");
        }

        const videoMatch = body.match(/file:\s*["']([^"']+\.m3u8[^"']*)["']/);
        if (!videoMatch || !videoMatch[1]) {
            throw new Error("HLS URL not found");
        }
        const videoFileUrl = videoMatch[1];

        // Capture only the `{…}` entry: the surrounding `tracks: [ … ]` text is not JSON,
        // so parsing the whole match can never succeed.
        const trackMatch = body.match(/tracks:\s*\[\s*({[^}]*})\s*\]/);
        let subtitleSources = [];
        if (trackMatch) {
            try {
                subtitleSources = [JSON.parse(trackMatch[1])];
            } catch (parseError) {
                // Player configs are often JS object literals (unquoted keys) rather than
                // strict JSON; subtitles are optional, so keep the playlist and move on.
                console.warn(`[getVideoAndSubtitles] Could not parse subtitle tracks: ${parseError.message}`);
            }
        }
        return { videoFileUrl, subtitleSources };
    } catch (error) {
        if (isCloudnestra) {
            console.error(`[getVideoAndSubtitles] Error fetching cloudnestra response:`, error);
        } else {
            console.error(`[getVideoAndSubtitles] Error processing URL:`, error);
        }
        throw error;
    }
}
 // 修改 scrapeProvider 函数
 // 在 scrapeProvider 函数中添加调试代码
+async function scrapeProvider_(domain, url, signal) {
     if (signal.aborted) throw new Error('Aborted');
     console.log(`\n[${domain}] Starting scrape for URL: ${url}`);
     }
 }
/**
 * Walks a provider's embed chain in a pooled browser and returns the HLS stream it exposes.
 *
 * Steps: open `url`, handle a `.cf-turnstile` widget if one is present, follow the first
 * iframe in a second page (handling a second widget if present), then resolve the final
 * iframe. When the final iframe points at `cloudnestra.com/rcp/`, the body of the matching
 * network response observed while browsing is parsed as JSON; otherwise the final iframe
 * URL is handed to `getVideoAndSubtitles`.
 *
 * @param {string} domain - Provider label used in log lines and in the result.
 * @param {string} url - Provider page to start from.
 * @param {AbortSignal} signal - Cancels the scrape; checked on entry and between steps.
 * @returns {Promise<{source_domain: string, hls_url: string, subtitles: Array, error: null}>}
 * @throws {Error} On abort, a missing iframe, or when no playlist URL can be obtained.
 */
async function scrapeProvider(domain, url, signal) {
    const throwIfAborted = () => {
        if (signal.aborted) throw new Error('Aborted');
    };
    throwIfAborted();
    console.log(`\n[${domain}] Starting scrape for URL: ${url}`);

    let browserInstance = null;
    const openedPages = [];
    const pendingCaptures = [];
    let cloudnestraResponse = null;

    // Observe traffic through events rather than route interception: `route.continue()`
    // resolves to undefined, so a response body can never be read from it.
    const watchNetwork = (targetPage) => {
        targetPage.on('request', (request) => {
            console.log(`[${domain}] Request: ${request.url()}`);
        });
        targetPage.on('response', (response) => {
            if (!response.url().includes('cloudnestra.com/rcp/')) return;
            // Tracked so the body is guaranteed to be read before it is consumed below;
            // both outcomes are handled, so these promises never reject.
            pendingCaptures.push(
                response.text().then(
                    (text) => {
                        console.log(`[${domain}] Cloudnestra response:`, text);
                        cloudnestraResponse = text;
                    },
                    (captureError) => {
                        console.warn(`[${domain}] Could not read cloudnestra response: ${captureError.message}`);
                    }
                )
            );
        });
    };

    const detectTurnstile = (targetPage) => targetPage.evaluate(() => {
        return document.querySelector('.cf-turnstile') !== null;
    });

    try {
        browserInstance = await browserPool.get();
        const browser = browserInstance.browser;

        // Provider landing page.
        const page = await browser.newPage();
        openedPages.push(page);
        watchNetwork(page);
        await page.goto(url, {
            waitUntil: 'networkidle',
            timeout: 60000
        });
        throwIfAborted();

        const hasTurnstile = await detectTurnstile(page);
        console.log(`[${domain}] Has Turnstile: ${hasTurnstile}`);
        if (hasTurnstile) {
            await handleSpecificTurnstile(page, domain);
        }

        const firstIframeSrc = await extractFirstIframeSrc(page, domain);
        if (!firstIframeSrc) throw new Error('First iframe not found');
        throwIfAborted();

        // The first iframe is loaded as its own page; watch it too, because the
        // cloudnestra request may be issued from here rather than from the landing page.
        const iframePage = await browser.newPage();
        openedPages.push(iframePage);
        watchNetwork(iframePage);
        await iframePage.goto(firstIframeSrc, {
            waitUntil: 'networkidle',
            timeout: 60000
        });
        throwIfAborted();

        const iframeHasTurnstile = await detectTurnstile(iframePage);
        console.log(`[${domain}] Iframe has Turnstile: ${iframeHasTurnstile}`);
        if (iframeHasTurnstile) {
            await handleSpecificTurnstile(iframePage, domain);
        }

        const finalIframeSrc = await extractFinalIframeSrc(iframePage, domain);
        if (!finalIframeSrc) throw new Error('Final iframe not found');
        throwIfAborted();

        if (finalIframeSrc.includes('cloudnestra.com/rcp/')) {
            await Promise.all(pendingCaptures);
            if (!cloudnestraResponse) throw new Error('No cloudnestra response found');

            let data;
            try {
                data = JSON.parse(cloudnestraResponse);
            } catch (parseError) {
                throw new Error("Failed to parse cloudnestra response");
            }
            // Checked outside the try so this error is not rewritten as a parse failure.
            if (!data || !data.file) {
                throw new Error("No video URL found in cloudnestra response");
            }
            console.log(`[${domain}] Found video URL in cloudnestra response:`, data.file);
            return {
                source_domain: domain,
                hls_url: data.file,
                subtitles: data.subtitles || [],
                error: null
            };
        }

        // Any other host: fetch and parse the final iframe directly.
        const { videoFileUrl, subtitleSources } = await getVideoAndSubtitles(finalIframeSrc);
        if (!videoFileUrl) throw new Error("HLS URL not found");
        return { source_domain: domain, hls_url: videoFileUrl, subtitles: subtitleSources, error: null };
    } catch (error) {
        console.error(`[${domain}] Error in scrapeProvider: ${error.message}`);
        throw error;
    } finally {
        // Close our pages before the browser goes back to the pool so they do not pile up.
        for (const openedPage of openedPages) {
            try {
                await openedPage.close();
            } catch (closeError) {
                console.warn(`[${domain}] Failed to close page: ${closeError.message}`);
            }
        }
        if (browserInstance) {
            console.log(`[${domain}] Releasing browser ${browserInstance.id} back to pool.`);
            await browserPool.release(browserInstance);
        }
    }
}
 // 修改 handleSpecificTurnstile 函数
 async function handleSpecificTurnstile(page, domain) {
     try {