googlesprojectzero committed on
Commit
8813c03
·
verified ·
1 Parent(s): 7c67c8f

Delete src/archive/archive_analyzer.py

Browse files
Files changed (1) hide show
  1. src/archive/archive_analyzer.py +0 -65
src/archive/archive_analyzer.py DELETED
@@ -1,65 +0,0 @@
1
- import asyncio
2
- import aiohttp
3
- from bs4 import BeautifulSoup
4
- from urllib.parse import urljoin
5
-
6
async def fetch_url(session, url, semaphore, timeout=10):
    """Fetch the body of *url* as decoded text, bounded by *semaphore*.

    Args:
        session: shared ``aiohttp.ClientSession`` to issue the GET with.
        url: absolute URL to fetch.
        semaphore: ``asyncio.Semaphore`` limiting concurrent in-flight requests.
        timeout: per-request timeout in seconds (default 10).

    Returns:
        The response body as ``str``.

    Raises:
        asyncio.TimeoutError: if the request exceeds *timeout*.
        aiohttp.ClientError: on any transport/protocol failure.

    NOTE(review): the previous version swallowed these exceptions and
    returned an ``{"error": ...}`` dict instead, which was then fed to
    BeautifulSoup by the caller and crashed with an unrelated TypeError.
    Raising lets ``analyze_source`` attach the source name to the real error.
    """
    async with semaphore:
        async with session.get(url, timeout=timeout) as response:
            return await response.text()
15
-
16
async def analyze_sources(sources, concurrency=10):
    """Analyze every ``name -> url`` entry of *sources* concurrently.

    At most *concurrency* HTTP requests are in flight at any moment; the
    shared semaphore is passed down to each per-source task.

    Returns:
        A list of per-source result dicts, in *sources* iteration order.
    """
    gate = asyncio.Semaphore(concurrency)
    pending = []
    for source_name, source_url in sources.items():
        pending.append(analyze_source(source_name, source_url, gate))
    return await asyncio.gather(*pending)
20
-
21
async def analyze_source(source_name, source_url, semaphore):
    """Fetch one page and extract its title and absolute link targets.

    Args:
        source_name: human-readable label reported back in the result.
        source_url: page URL to fetch; also the base for resolving links.
        semaphore: concurrency limiter forwarded to ``fetch_url``.

    Returns:
        On success: ``{"source", "title", "links"}`` where links are made
        absolute with ``urljoin``.  On any failure: ``{"source", "error"}``.
    """
    async with aiohttp.ClientSession() as session:
        try:
            html = await fetch_url(session, source_url, semaphore)
            # Defensive: some versions of fetch_url report failure by
            # returning an {"error": ...} dict rather than raising.  Surface
            # that as this source's error instead of letting BeautifulSoup
            # choke on a non-string and mask the real cause.
            if isinstance(html, dict):
                return {"source": source_name, **html}
            soup = BeautifulSoup(html, 'html.parser')
            # <title> may exist but be empty, in which case .string is None;
            # fall back to the placeholder in both cases.
            if soup.title and soup.title.string:
                title = soup.title.string
            else:
                title = "No Title Found"
            return {
                "source": source_name,
                "title": title,
                # Resolve relative hrefs against the page URL so callers
                # always receive absolute, directly usable links.
                "links": [urljoin(source_url, a['href'])
                          for a in soup.find_all('a', href=True)],
            }
        except Exception as e:
            # One bad source must not abort the whole gather(); report it
            # in-band alongside the successful results.
            return {"source": source_name, "error": str(e)}
34
-
35
if __name__ == "__main__":
    # Demo entry point.  The previous version discarded the gathered
    # results, so running the module produced no visible output; print each
    # per-source result dict instead.
    sources = {
        "Source A": "http://example.com",
        "Source B": "http://example.org"
    }
    results = asyncio.run(analyze_sources(sources))
    for result in results:
        print(result)
41
-
42
- # import asyncio
43
- # import aiohttp
44
- # from bs4 import BeautifulSoup
45
-
46
- # async def fetch_url(session, url):
47
- # async with session.get(url) as response:
48
- # return await response.text()
49
-
50
- # async def analyze_source(source_name, source_url):
51
- # async with aiohttp.ClientSession() as session:
52
- # try:
53
- # html = await fetch_url(session, source_url)
54
- # soup = BeautifulSoup(html, 'html.parser')
55
- # return {
56
- # "source": source_name,
57
- # "title": soup.title.string if soup.title else "No Title Found",
58
- # "links": [a['href'] for a in soup.find_all('a', href=True)]
59
- # }
60
- # except Exception as e:
61
- # return {"source": source_name, "error": str(e)}
62
-
63
- # async def analyze_sources(sources):
64
- # tasks = [analyze_source(name, url) for name, url in sources.items()]
65
- # return await asyncio.gather(*tasks)