# Tablet-defect-detection / src/feature_extractor.py
"""
Feature extraction using pretrained ResNet backbone
"""
from typing import Dict, List, Optional

import torch
import torch.nn as nn
from torchvision.models import resnet18, ResNet18_Weights

import config
class FeatureExtractor(nn.Module):
    """Extract multi-scale features from a frozen, pretrained ResNet backbone.

    Forward hooks capture the outputs of the requested intermediate layers;
    calling the module returns a dict mapping layer name -> feature tensor.
    """

    def __init__(self, backbone: str = "resnet18",
                 layers: Optional[List[str]] = None):
        """
        Args:
            backbone: Backbone architecture name (only "resnet18" is supported).
            layers: Layer names to extract features from; defaults to
                config.FEATURE_LAYERS when None.

        Raises:
            ValueError: If an unsupported backbone name is given.
        """
        super().__init__()
        if layers is None:
            layers = config.FEATURE_LAYERS
        self.layers = layers
        # Load pretrained ResNet
        if backbone == "resnet18":
            model = resnet18(weights=ResNet18_Weights.IMAGENET1K_V1)
        else:
            raise ValueError(f"Unsupported backbone: {backbone}")
        # Register hooks to capture intermediate activations by layer name
        self.feature_maps = {}
        self.hooks = []
        for name, module in model.named_children():
            if name in self.layers:
                hook = module.register_forward_hook(self._get_hook(name))
                self.hooks.append(hook)
        # Keep the full model; the classifier head is harmless since we only
        # read the hooked intermediate outputs.
        self.model = model
        self.model.eval()
        # Freeze all parameters — the backbone is used purely for inference
        for param in self.model.parameters():
            param.requires_grad = False

    def _get_hook(self, name: str):
        """Create a forward hook that stores the layer's output under `name`."""
        def hook(module, input, output):
            self.feature_maps[name] = output
        return hook

    def forward(self, x: torch.Tensor) -> Dict[str, torch.Tensor]:
        """
        Extract features from multiple layers.

        Args:
            x: Input tensor [B, 3, H, W]
        Returns:
            Dictionary mapping layer names to feature tensors
        """
        self.feature_maps.clear()
        with torch.no_grad():
            _ = self.model(x)
        return self.feature_maps

    def get_feature_dimensions(self) -> Dict[str, Dict[str, int]]:
        """Run a dummy forward pass and report each hooked layer's output shape.

        Returns:
            Mapping from layer name to {'channels', 'height', 'width'}.
        """
        # Fix: build the dummy input on the model's device so this still works
        # after the extractor has been moved to GPU.
        device = next(self.model.parameters()).device
        dummy_input = torch.randn(1, 3, *config.IMAGE_SIZE, device=device)
        features = self.forward(dummy_input)
        return {
            name: {
                'channels': feat.shape[1],
                'height': feat.shape[2],
                'width': feat.shape[3],
            }
            for name, feat in features.items()
        }

    def __del__(self):
        """Remove forward hooks when the object is destroyed.

        Fix: guard against partially-initialised instances — __init__ may have
        raised (e.g. unsupported backbone) before self.hooks was assigned, and
        the original would then raise AttributeError during GC.
        """
        for hook in getattr(self, "hooks", []):
            hook.remove()
def extract_embeddings(extractor: FeatureExtractor,
                       x: torch.Tensor) -> torch.Tensor:
    """
    Extract and concatenate multi-scale embeddings.

    Args:
        extractor: Feature extractor model
        x: Input tensor [B, 3, H, W]
    Returns:
        Concatenated embeddings [B, D, H', W'] where D is total channels
    """
    feature_maps = extractor(x)
    # Collect features in the configured layer order.
    ordered = [feature_maps[layer] for layer in extractor.layers]

    # The target spatial size is that of the feature map with the greatest
    # height (the shallowest layer, which has the finest resolution).
    target_size = None
    for feat in ordered:
        if target_size is None or feat.shape[2] > target_size[0]:
            target_size = (feat.shape[2], feat.shape[3])

    # Upsample every map to the target resolution, leaving already-matching
    # maps untouched, then stack along the channel dimension.
    aligned = [
        feat if feat.shape[2:] == target_size
        else torch.nn.functional.interpolate(
            feat, size=target_size, mode='bilinear', align_corners=False
        )
        for feat in ordered
    ]
    return torch.cat(aligned, dim=1)