Spaces:

hassanshka
/

layout

Runtime error

App Files Files Community

layout / test_combined_models.py

hassanshka

Add test_combined_models.py and compare/ folder (excluding cvat_project_7_export and Annika 2 folders)

0a216c0 2 months ago

raw

history blame contribute delete

11 kB

	#!/usr/bin/env python3
	"""
	Script to combine predictions from three YOLO models:
	- best_emanuskript_segmentation.pt (segmentation model for manuscript elements)
	- best_catmus.pt (segmentation model for lines and zones)
	- best_zone_detection.pt (detection model for zones)

	WORKFLOW SUMMARY:
	================

	1. MODEL PREDICTIONS (run_model_predictions):
	- Runs each of the 3 models on the input image
	- Saves predictions to JSON files in separate folders
	- Emanuskript: detects manuscript elements (Main script, Plain initial, etc.)
	- Catmus: detects lines (DefaultLine, InterlinearLine)
	- Zone: detects zones (MainZone, DropCapitalZone, etc.)

	2. COMBINING & FILTERING (combine_and_filter_predictions):
	- Uses ImageBatch class to:
	a) Load all predictions from the 3 JSON files
	b) Unify class names (maps catmus/zone names to coco_class_mapping)
	c) Filter overlapping/conflicting annotations using spatial indexing
	d) Convert to COCO format
	- Only keeps classes defined in coco_class_mapping (25 classes total)

	3. OUTPUT:
	- COCO format JSON file with filtered annotations
	- Only contains classes from coco_class_mapping

	KEY CLASSES IN coco_class_mapping:
	- Main script black/coloured
	- Variant script black/coloured
	- Plain initial (coloured/highlighted/black)
	- Historiated, Inhabited, Embellished
	- Page Number, Quire Mark, Running header
	- Gloss, Illustrations, Column
	- Music, MusicZone, MusicLine
	- Border, Table, Diagram
	- GraphicZone

	The ImageBatch class handles:
	- Spatial overlap detection (removes duplicates)
	- Class name unification (catmus_zones_mapping)
	- Annotation filtering based on overlap thresholds
	"""

	import os
	import json
	import tempfile
	import shutil
	from pathlib import Path
	from ultralytics import YOLO
	import sys

	# Put the directory containing this file at the front of sys.path so the
	# project-local `utils` package resolves regardless of the working directory.
	current_dir = os.path.dirname(os.path.abspath(__file__))
	PROJECT_ROOT = current_dir  # This file is in the project root
	sys.path.insert(0, current_dir)

	try:
	    from utils.image_batch_classes import ImageBatch, coco_class_mapping
	except ImportError as e:
	    print(f"Warning: Could not import ImageBatch: {e}")
	    print("Make sure all dependencies are installed (rtree, shapely, etc.)")
	    # Define BOTH imported names so the module exposes the same globals
	    # whether or not the import succeeded; callers test `ImageBatch is None`
	    # before touching either of them.
	    ImageBatch = None
	    coco_class_mapping = None

	def _predict_and_save(weights_filename, image_path, json_path, classes=None):
	    """Run one YOLO model on ``image_path`` and write its first result as JSON.

	    Args:
	        weights_filename: Weights file name, resolved relative to PROJECT_ROOT.
	        image_path: Image handed to ``model.predict``.
	        json_path: Destination file for ``results[0].to_json()``.
	        classes: Optional list of class ids forwarded to ``predict``; when
	            None the ``classes`` argument is not passed at all.

	    Returns:
	        ``json_path``, so the caller can report where the file was written.
	    """
	    model = YOLO(os.path.join(PROJECT_ROOT, weights_filename))
	    predict_kwargs = {
	        'iou': 0.3,
	        'device': 'cpu',
	        'augment': False,
	        'stream': False,
	    }
	    if classes is not None:
	        predict_kwargs['classes'] = classes
	    results = model.predict(image_path, **predict_kwargs)
	    with open(json_path, 'w') as f:
	        f.write(results[0].to_json())
	    # `model` and `results` are locals, so they are released when this
	    # function returns -- before the next model is loaded.
	    return json_path


	def run_model_predictions(image_path, output_dir):
	    """Run all three models on the image and save predictions.

	    Creates ``catmus``, ``emanuskript`` and ``zone`` sub-folders under
	    ``output_dir`` and writes one ``<image stem>.json`` file into each.

	    Args:
	        image_path: Path of the image to run the models on.
	        output_dir: Directory under which the three sub-folders are created.

	    Returns:
	        Dict with keys ``'catmus'``, ``'emanuskript'`` and ``'zone'`` mapping
	        to the corresponding prediction folders.
	    """
	    # Create output directories
	    catmus_dir = os.path.join(output_dir, 'catmus')
	    emanuskript_dir = os.path.join(output_dir, 'emanuskript')
	    zone_dir = os.path.join(output_dir, 'zone')

	    for dir_path in (catmus_dir, emanuskript_dir, zone_dir):
	        os.makedirs(dir_path, exist_ok=True)

	    image_id = Path(image_path).stem

	    print("=" * 60)
	    print("Running Model Predictions")
	    print("=" * 60)

	    # (description, weights file, output folder, class-id filter), in run order.
	    jobs = [
	        (
	            "emanuskript segmentation",
	            "best_emanuskript_segmentation.pt",
	            emanuskript_dir,
	            # NOTE(review): id 19 is absent from this list; the reason is
	            # not visible in this file -- confirm against the model's classes.
	            [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20],
	        ),
	        (
	            "catmus segmentation",
	            "best_catmus.pt",
	            catmus_dir,
	            [1, 7],  # DefaultLine and InterlinearLine
	        ),
	        (
	            "zone detection",
	            "best_zone_detection.pt",
	            zone_dir,
	            None,  # no class filter for the zone model
	        ),
	    ]

	    for step, (description, weights, out_dir, classes) in enumerate(jobs, start=1):
	        print(f"\n[{step}/{len(jobs)}] Running {description} model...")
	        saved_path = _predict_and_save(
	            weights,
	            image_path,
	            f'{out_dir}/{image_id}.json',
	            classes,
	        )
	        print(f" ✓ Saved to: {saved_path}")

	    return {
	        'catmus': catmus_dir,
	        'emanuskript': emanuskript_dir,
	        'zone': zone_dir
	    }


	def combine_and_filter_predictions(image_path, labels_folders, output_json_path=None):
	    """Combine predictions from all models and filter to coco_class_mapping classes.

	    Args:
	        image_path: Path of the image the predictions belong to.
	        labels_folders: Dict with keys ``'catmus'``, ``'emanuskript'`` and
	            ``'zone'`` giving the folders that hold each model's JSON output.
	        output_json_path: Optional path; when truthy the resulting COCO dict
	            is also written there as indented JSON.

	    Returns:
	        The COCO dict restricted to category ids found in
	        ``coco_class_mapping``, or None when ImageBatch could not be imported.
	    """
	    print("\n" + "=" * 60)
	    print("Combining and Filtering Predictions")
	    print("=" * 60)

	    if ImageBatch is None:
	        print("\nERROR: ImageBatch class not available.")
	        print("Please install missing dependencies:")
	        print(" pip install rtree shapely")
	        return None

	    # Create a temporary folder with just the image file
	    # ImageBatch.load_images() loads all files in the folder, so we need only images
	    temp_image_dir = tempfile.mkdtemp()
	    try:
	        image_filename = os.path.basename(image_path)
	        shutil.copy2(image_path, os.path.join(temp_image_dir, image_filename))

	        image_batch = ImageBatch(
	            image_folder=temp_image_dir,
	            catmus_labels_folder=labels_folders['catmus'],
	            emanuskript_labels_folder=labels_folders['emanuskript'],
	            zone_labels_folder=labels_folders['zone']
	        )

	        # Load images
	        print("\n[Step 1] Loading images...")
	        image_batch.load_images()
	        print(f" ✓ Loaded {len(image_batch.images)} image(s)")

	        # Load annotations from all three models
	        print("\n[Step 2] Loading annotations from all models...")
	        image_batch.load_annotations()

	        total_annotations = sum(len(img.annotations) for img in image_batch.images)
	        print(f" ✓ Loaded {total_annotations} total annotations")

	        # Unify names (maps catmus/zone names to coco_class_mapping names)
	        print("\n[Step 3] Unifying class names...")
	        image_batch.unify_names()

	        # Filter annotations (removes overlapping/conflicting annotations)
	        print("\n[Step 4] Filtering annotations...")
	        for img in image_batch.images:
	            # NOTE(review): the return value is only used for the log line
	            # below; presumably filter_annotations() also records the result
	            # on the image for return_coco_file() -- confirm in ImageBatch.
	            filtered = img.filter_annotations()
	            print(f" Image {img.filename}: {len(img.annotations)} -> {len(filtered)} annotations")

	        # Get COCO format JSON
	        print("\n[Step 5] Generating COCO format...")
	        coco_json = image_batch.return_coco_file()

	        # Filter to only classes in coco_class_mapping
	        valid_category_ids = set(coco_class_mapping.values())

	        filtered_annotations = [
	            ann for ann in coco_json['annotations']
	            if ann['category_id'] in valid_category_ids
	        ]
	        coco_json['annotations'] = filtered_annotations

	        # Update categories to only include valid ones
	        coco_json['categories'] = [
	            cat for cat in coco_json['categories']
	            if cat['id'] in valid_category_ids
	        ]

	        print(f" ✓ Final annotations: {len(filtered_annotations)}")
	        print(f" ✓ Final categories: {len(coco_json['categories'])}")

	        # Save to file if path provided
	        if output_json_path:
	            with open(output_json_path, 'w') as f:
	                json.dump(coco_json, f, indent=2)
	            print(f"\n ✓ Saved COCO JSON to: {output_json_path}")

	        return coco_json
	    finally:
	        # Always remove the temporary image directory, including when any
	        # step above raises; previously it leaked on every failure.
	        shutil.rmtree(temp_image_dir, ignore_errors=True)


	def print_summary(coco_json):
	    """Print annotation and category totals plus a per-category breakdown.

	    Args:
	        coco_json: Dict with an ``'annotations'`` list (each item carrying a
	            ``'category_id'``) and a ``'categories'`` list (each item carrying
	            ``'id'`` and ``'name'``).
	    """
	    banner = "=" * 60
	    print("\n" + banner)
	    print("Results Summary")
	    print(banner)

	    # Tally how many annotations fall under each category id.
	    tally = {}
	    for annotation in coco_json['annotations']:
	        key = annotation['category_id']
	        if key in tally:
	            tally[key] += 1
	        else:
	            tally[key] = 1

	    # Lookup table from category id to its display name.
	    names_by_id = {}
	    for category in coco_json['categories']:
	        names_by_id[category['id']] = category['name']

	    print(f"\nTotal Annotations: {len(coco_json['annotations'])}")
	    print(f"Total Categories: {len(coco_json['categories'])}")
	    print(f"\nAnnotations per Category:")
	    for key in sorted(tally):
	        # Ids with no entry in 'categories' are shown as Unknown(<id>).
	        if key in names_by_id:
	            label = names_by_id[key]
	        else:
	            label = f"Unknown({key})"
	        occurrences = tally[key]
	        print(f" {label:30s}: {occurrences:4d}")


	def visualize_results(image_path, coco_json):
	    """Print hints on how the combined results can be visualized.

	    No plot is produced here. The function only checks that ImageBatch is
	    importable and then lists the available visualization options.

	    Args:
	        image_path: Path of the processed image (currently unused).
	        coco_json: Combined COCO dict (currently unused).
	    """
	    print("\n" + "=" * 60)
	    print("Visualizing Results")
	    print("=" * 60)

	    # Best-effort probe: the hints below refer to ImageBatch, so report
	    # instead of crashing when it cannot be imported.
	    try:
	        from utils.image_batch_classes import ImageBatch  # noqa: F401
	    except Exception as e:
	        print(f"Visualization not available: {e}")
	        return

	    # The unused temporary directory that used to be created (and
	    # immediately deleted) here has been removed; nothing was written to it.
	    print("\nTo visualize, you can:")
	    print("1. Use the COCO JSON file with any COCO visualization tool")
	    print("2. Load the JSON in your annotation tool")
	    print("3. Use the ImageBatch.plot_annotations() method")


	def main(image_path="bnf-naf-10039__page-001-of-004.jpg",
	         output_json="combined_predictions.json"):
	    """Main function to run the complete pipeline.

	    Runs the three models on ``image_path``, combines and filters their
	    predictions, writes the COCO JSON to ``output_json``, then prints a
	    summary and the visualization hints.

	    Args:
	        image_path: Image to process; defaults to the sample page this
	            script was written for.
	        output_json: Destination of the combined COCO JSON file.

	    Returns:
	        None. Returns early (after printing a message) when the image does
	        not exist or when the predictions could not be combined.
	    """
	    if not os.path.exists(image_path):
	        print(f"Error: Image file not found: {image_path}")
	        return

	    # Create temporary directory for predictions
	    with tempfile.TemporaryDirectory() as temp_dir:
	        print(f"Using temporary directory: {temp_dir}")

	        # Step 1: Run all three models
	        labels_folders = run_model_predictions(image_path, temp_dir)

	        # Step 2: Combine and filter predictions
	        coco_json = combine_and_filter_predictions(
	            image_path,
	            labels_folders,
	            output_json_path=output_json
	        )

	        # combine_and_filter_predictions returns None when ImageBatch is not
	        # available; passing that on to print_summary would raise TypeError.
	        if coco_json is None:
	            print("\nPipeline aborted: predictions could not be combined.")
	            return

	        # Step 3: Print summary
	        print_summary(coco_json)

	        # Step 4: Visualize (optional)
	        visualize_results(image_path, coco_json)

	        print("\n" + "=" * 60)
	        print("Pipeline Complete!")
	        print("=" * 60)
	        print(f"\nOutput saved to: {output_json}")


	if __name__ == "__main__":
	    main()