Spaces:

minaewrw
/

mina-api

Paused

mina-api / tools /analyze_structure.py

Mina

Fresh deploy without large files

25ae7fe 5 months ago

1.24 kB

	from bs4 import BeautifulSoup
	import sys
	import io

	# Set encoding for Windows terminal
	if sys.platform == 'win32':
	sys.stdout = io.TextIOWrapper(sys.stdout.buffer, encoding='utf-8')

	def analyze_html():
	with open("flaresolverr_output.html", "r", encoding="utf-8") as f:
	html = f.read()

	soup = BeautifulSoup(html, 'html.parser')

	print("--- Analyzing Links ---")
	links = soup.find_all('a', href=True)
	for i, a in enumerate(links[:100]):
	href = a['href']
	text = a.get_text(strip=True)
	if 'cat=' in href or 'video' in href or 'movie' in href or 'series' in href:
	print(f"{i}: Text: {text} \| Href: {href}")

	print("\n--- Analyzing Containers ---")
	# Look for common patterns in classes
	classes = set()
	for tag in soup.find_all(True, class_=True):
	for c in tag['class']:
	classes.add(c)

	print(f"Found {len(classes)} unique classes.")
	# Print classes that might be containers
	potential = [c for c in classes if any(x in c.lower() for x in ['item', 'video', 'movie', 'thumb', 'card', 'block', 'col'])]
	print(f"Potential container classes: {potential}")

	if __name__ == "__main__":
	analyze_html()