Spaces:

rethinks
/

childYb

Running

App Files Files Community

childYb / test_single_month.py

rethinks

Upload 6 files

00e6a0c verified 27 days ago

raw

history blame contribute delete

4.7 kB

	"""
	Test script: Select best 40 photos from a single month folder.
	Usage: python test_single_month.py <folder_path> [target_count]

	Example:
	python test_single_month.py "C:/Photos/2024/January" 40
	"""

	import sys
	import os
	from pathlib import Path

	# Add project to path
	sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))

	from photo_selector.monthly_selector import MonthlyPhotoSelector


	def _find_photos(folder):
	    """Return the image files directly inside *folder*, sorted by path.

	    Only regular files whose suffix (compared case-insensitively) is a known
	    image extension are returned. Sub-folders are skipped even when their
	    name happens to end in an image extension.
	    """
	    extensions = {'.jpg', '.jpeg', '.png', '.heic', '.heif', '.webp'}
	    # iterdir() yields entries in arbitrary order; sorting keeps runs repeatable.
	    return sorted(
	        entry for entry in folder.iterdir()
	        if entry.is_file() and entry.suffix.lower() in extensions
	    )


	def test_single_month(folder_path: str, target: int = 40):
	    """
	    Test photo selection on a single folder and print a report.

	    The photos found in the folder are embedded with
	    ``MonthlyPhotoSelector.generate_embeddings``, scored one by one with
	    ``PhotoScorer.score_photo``, and then handed to
	    ``MonthlyPhotoSelector.select_hybrid_hdbscan`` together with ``target``.
	    The selection and its per-cluster distribution are printed to stdout.

	    Args:
	        folder_path: Path to folder containing photos
	        target: Number of photos to select (default 40)

	    Returns:
	        Whatever ``select_hybrid_hdbscan`` returns (iterated here as a sized
	        collection of dicts), or ``None`` when the folder does not exist, is
	        not a directory, or contains no photos.
	    """
	    # Function-scope import, like the PhotoScorer import below.
	    from collections import Counter

	    separator = '=' * 60
	    folder = Path(folder_path)

	    if not folder.exists():
	        print(f"Error: Folder not found: {folder}")
	        return
	    if not folder.is_dir():
	        # A plain file would otherwise blow up inside iterdir().
	        print(f"Error: Not a folder: {folder}")
	        return

	    # Count photos
	    photos = _find_photos(folder)

	    print(f"\n{separator}")
	    print("SINGLE MONTH TEST")
	    print(separator)
	    print(f"Folder: {folder}")
	    print(f"Photos found: {len(photos)}")
	    print(f"Target selection: {target}")
	    print(f"{separator}\n")

	    if not photos:
	        print("No photos found in folder!")
	        return

	    # Initialize selector
	    print("Initializing selector (loading CLIP model)...")
	    selector = MonthlyPhotoSelector()

	    # Step 1: Generate embeddings
	    print(f"\n[Step 1] Generating CLIP embeddings for {len(photos)} photos...")
	    photo_paths = [str(p) for p in photos]
	    embeddings = selector.generate_embeddings(photo_paths)
	    print(f"Generated embeddings for {len(embeddings)} photos")

	    # Step 2: Score photos
	    print("\n[Step 2] Scoring photos...")
	    from photo_selector.scoring import PhotoScorer
	    scorer = PhotoScorer()

	    scored_photos = []
	    for index, photo_path in enumerate(photo_paths, start=1):
	        # Progress line every tenth photo.
	        if index % 10 == 0:
	            print(f" Scoring {index}/{len(photo_paths)}...")

	        # Get scores
	        scores = scorer.score_photo(photo_path)

	        scored_photos.append({
	            'filename': Path(photo_path).name,
	            'filepath': photo_path,
	            'total': scores.get('total', 0),
	            'face_quality': scores.get('face_quality', 0),
	            'aesthetic_quality': scores.get('aesthetic_quality', 0),
	            'emotional_signal': scores.get('emotional_signal', 0),
	            'uniqueness': scores.get('uniqueness', 0.5),
	            'num_faces': scores.get('num_faces', 0),
	        })

	    print(f"Scored {len(scored_photos)} photos")

	    # Step 3: Cluster and select using HDBSCAN
	    print("\n[Step 3] Running HDBSCAN clustering and selection...")
	    selected = selector.select_hybrid_hdbscan(
	        scored_photos,
	        embeddings,
	        target=target,
	    )

	    # Results
	    print(f"\n{separator}")
	    print("RESULTS")
	    print(separator)
	    print(f"Total photos: {len(photos)}")
	    print(f"Selected: {len(selected)}")
	    print(f"{separator}\n")

	    # Show selected photos
	    print("Selected photos (ranked by score):\n")
	    print(f"{'#':<4} {'Score':>6} {'Faces':>6} {'Cluster':>8} {'Similarity':>10} {'Filename':<40}")
	    print("-" * 80)

	    for rank, photo in enumerate(selected, 1):
	        score = photo.get('total', 0) * 100
	        faces = photo.get('num_faces', 0)
	        cluster = photo.get('cluster_id', -1)
	        # Negative cluster ids (and photos without one) are shown as "Fallback".
	        cluster_label = f"C{cluster}" if cluster >= 0 else "Fallback"
	        similarity = photo.get('max_similarity', 0) * 100
	        # Truncate long names so the table columns stay aligned.
	        filename = photo.get('filename', '?')[:38]

	        print(f"{rank:<4} {score:>5.1f}% {faces:>6} {cluster_label:>8} {similarity:>9.1f}% {filename:<40}")

	    # Cluster distribution
	    print(f"\n{separator}")
	    print("CLUSTER DISTRIBUTION")
	    print(separator)

	    cluster_counts = Counter(photo.get('cluster_id', -1) for photo in selected)

	    for cid in sorted(cluster_counts):
	        label = f"Cluster {cid}" if cid >= 0 else "Fallback"
	        count = cluster_counts[cid]
	        bar = "█" * count
	        print(f" {label:<12}: {count:>3} {bar}")

	    print(f"\n{separator}")

	    return selected


	# The name starts with ``test_``, so pytest would otherwise collect this CLI
	# helper as a test and fail on the missing ``folder_path`` fixture.
	test_single_month.__test__ = False


	if __name__ == "__main__":
	    # Script entry point: argv[1] is the photo folder, the optional argv[2]
	    # is the number of photos to select (40 when omitted).
	    if len(sys.argv) < 2:
	        print(__doc__)
	        print("\nNo folder provided. Please specify a folder path.")
	        sys.exit(1)

	    folder_path = sys.argv[1]
	    target = 40

	    if len(sys.argv) > 2:
	        raw_target = sys.argv[2]
	        try:
	            target = int(raw_target)
	        except ValueError:
	            # Show the usage text instead of a raw traceback for input like "forty".
	            print(__doc__)
	            print(f"\nInvalid target count: {raw_target!r}. Please provide a positive integer.")
	            sys.exit(1)
	        if target < 1:
	            # Zero or negative counts are rejected rather than passed to the selector.
	            print(__doc__)
	            print(f"\nInvalid target count: {raw_target!r}. Please provide a positive integer.")
	            sys.exit(1)

	    test_single_month(folder_path, target)