Spaces:

Harisri
/

FLOOR2MODEL

Sleeping

FLOOR2MODEL / src /segmentation /trainer.py

Harisri

Purged CV model deployment

fc895f4 23 days ago

8.45 kB

	"""
	trainer.py
	----------
	YOLOv8 segmentation trainer for floor plan element detection.

	Automatically selects the best available device:
	- Apple Silicon (M1/M2/M3/M4): uses MPS
	- NVIDIA GPU: uses CUDA
	- Fallback: CPU

	Usage:
	from src.segmentation.trainer import SegmentationTrainer

	trainer = SegmentationTrainer(dataset_yaml="data/yolo_dataset/dataset.yaml")
	trainer.train()
	trainer.export()
	"""

	import os
	import platform
	from pathlib import Path
	from typing import Optional

	import torch


	# ── Device detection ──────────────────────────────────────────────────────────

	def get_best_device() -> str:
	"""
	Returns the best available device string for PyTorch / Ultralytics.
	Priority: MPS (Apple Silicon) > CUDA (if compatible) > CPU
	"""
	if torch.backends.mps.is_available():
	print("Device: Apple Silicon MPS (GPU accelerated)")
	return "mps"
	elif torch.cuda.is_available():
	# Check CUDA compute capability — RTX 5060 (sm_120) not supported by older PyTorch
	major, minor = torch.cuda.get_device_capability(0)
	sm = major * 10 + minor
	supported = [50, 60, 61, 70, 75, 80, 86, 90]
	if sm in supported:
	gpu = torch.cuda.get_device_name(0)
	print(f"Device: CUDA — {gpu}")
	return "0"
	else:
	gpu = torch.cuda.get_device_name(0)
	print(f"Device: CPU (GPU {gpu} sm_{sm} not supported by this PyTorch build)")
	return "cpu"
	else:
	print("Device: CPU (training will be slow — consider Colab)")
	return "cpu"


	# ── Trainer ───────────────────────────────────────────────────────────────────

	class SegmentationTrainer:
	"""
	Wraps Ultralytics YOLOv8 for floor plan segmentation training.

	Args:
	dataset_yaml: Path to the dataset.yaml generated by CubiCasaDataset.
	model_size: YOLOv8 model variant: 'n' (nano), 's' (small), 'm' (medium).
	For M4 MacBook Air, 's' is the sweet spot.
	output_dir: Where to save training runs.
	epochs: Number of training epochs.
	batch_size: Batch size. Use 8-16 for MPS, 4-8 for CPU.
	img_size: Input image size for training.
	device: Override device ('mps', 'cpu', '0'). Auto-detected if None.
	"""

	# Model weight files (downloaded automatically on first run)
	MODEL_WEIGHTS = {
	"n": "yolov8n-seg.pt", # 3.4M params — fastest
	"s": "yolov8s-seg.pt", # 11.8M params — recommended for M4
	"m": "yolov8m-seg.pt", # 27.3M params — most accurate
	}

	def __init__(
	self,
	dataset_yaml: str,
	model_size: str = "s",
	output_dir: str = "models/segmentation",
	epochs: int = 100,
	batch_size: int = 8,
	img_size: int = 640,
	device: Optional[str] = None,
	pretrained: bool = True,
	):
	self.dataset_yaml = Path(dataset_yaml)
	self.model_size = model_size
	self.output_dir = Path(output_dir)
	self.epochs = epochs
	self.batch_size = batch_size
	self.img_size = img_size
	self.device = device or get_best_device()
	self.pretrained = pretrained
	self.model = None

	if model_size not in self.MODEL_WEIGHTS:
	raise ValueError(
	f"model_size must be one of {list(self.MODEL_WEIGHTS.keys())}"
	)
	if not self.dataset_yaml.exists():
	raise FileNotFoundError(f"Dataset YAML not found: {dataset_yaml}")

	def train(self) -> str:
	"""
	Start YOLOv8 training.

	Returns:
	Path to the best model weights file.
	"""
	from ultralytics import YOLO

	weights = self.MODEL_WEIGHTS[self.model_size]
	print(f"\nStarting training:")
	print(f" Model: YOLOv8{self.model_size}-seg ({weights})")
	print(f" Dataset: {self.dataset_yaml}")
	print(f" Device: {self.device}")
	print(f" Epochs: {self.epochs}")
	print(f" Batch: {self.batch_size}")
	print(f" Img size:{self.img_size}")
	print()

	self.model = YOLO(weights)

	results = self.model.train(
	data=str(self.dataset_yaml),
	epochs=self.epochs,
	batch=self.batch_size,
	imgsz=self.img_size,
	device=self.device,
	project=str(self.output_dir),
	name="floor_plan_seg",
	# Augmentation — essential for floor plans
	augment=True,
	degrees=10.0, # Random rotation ±10°
	translate=0.1, # Random translation
	scale=0.5, # Random scale
	fliplr=0.5, # Horizontal flip
	flipud=0.0, # No vertical flip (plans are top-down)
	# Optimizer settings
	optimizer="AdamW",
	lr0=0.001,
	lrf=0.01,
	weight_decay=0.0005,
	warmup_epochs=3,
	# Save settings
	save=True,
	save_period=10, # Save checkpoint every 10 epochs
	patience=30, # Early stopping patience
	# Logging
	verbose=True,
	plots=True,
	)

	best_weights = (
	Path(results.save_dir) / "weights" / "best.pt"
	)
	print(f"\nTraining complete. Best weights: {best_weights}")
	return str(best_weights)

	def resume(self, checkpoint_path: str) -> str:
	"""Resume training from a checkpoint."""
	from ultralytics import YOLO
	print(f"Resuming from checkpoint: {checkpoint_path}")
	self.model = YOLO(checkpoint_path)
	results = self.model.train(resume=True)
	return str(Path(results.save_dir) / "weights" / "best.pt")

	def validate(self, weights_path: Optional[str] = None) -> dict:
	"""
	Run validation on the test set.

	Returns:
	Dictionary of evaluation metrics (mAP50, mAP50-95, etc.)
	"""
	from ultralytics import YOLO

	if weights_path:
	model = YOLO(weights_path)
	elif self.model:
	model = self.model
	else:
	raise ValueError(
	"No model loaded. Run train() first or pass weights_path."
	)

	metrics = model.val(
	data=str(self.dataset_yaml),
	device=self.device,
	split="test",
	)

	print("\nValidation results:")
	print(f" mAP50: {metrics.seg.map50:.4f}")
	print(f" mAP50-95: {metrics.seg.map:.4f}")
	return {
	"map50": metrics.seg.map50,
	"map50_95": metrics.seg.map,
	}

	def export(
	self,
	weights_path: Optional[str] = None,
	format: str = "onnx",
	) -> str:
	"""
	Export trained model for production deployment.

	Args:
	weights_path: Path to best.pt. Uses last trained model if None.
	format: Export format: 'onnx', 'coreml' (Apple), 'torchscript'.

	Returns:
	Path to exported model file.
	"""
	from ultralytics import YOLO

	if weights_path:
	model = YOLO(weights_path)
	elif self.model:
	model = self.model
	else:
	raise ValueError("No model to export. Run train() first.")

	print(f"Exporting model to {format.upper()} format...")

	# CoreML is best for on-device M4 inference
	if format == "coreml":
	path = model.export(
	format="coreml",
	imgsz=self.img_size,
	nms=True,
	)
	else:
	path = model.export(
	format=format,
	imgsz=self.img_size,
	dynamic=True,
	simplify=True,
	)

	print(f"Exported: {path}")
	return str(path)