Neylton commited on
Commit
168169c
Β·
1 Parent(s): 5705ccc

Add utils folder with required modules

Browse files
utils/__pycache__/data_utils.cpython-311.pyc ADDED
Binary file (18.7 kB). View file
 
utils/__pycache__/model_utils.cpython-311.pyc ADDED
Binary file (14.2 kB). View file
 
utils/data_utils.py ADDED
@@ -0,0 +1,388 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Data utilities for telecom site classification
3
+ Handles data loading, transformations, and dataset management
4
+ """
5
+
6
+ import os
7
+ import torch
8
+ from torch.utils.data import Dataset, DataLoader, WeightedRandomSampler
9
+ from torchvision import transforms, datasets
10
+ from PIL import Image
11
+ import numpy as np
12
+ from typing import Tuple, Dict, List, Optional
13
+ from collections import Counter
14
+ import random
15
+
16
+ class TelecomSiteDataset(Dataset):
17
+ """
18
+ Custom dataset for telecom site images
19
+ Supports both training and validation modes with appropriate transforms
20
+ """
21
+
22
+ def __init__(self, data_dir: str, split: str = 'train', image_size: int = 224):
23
+ """
24
+ Initialize telecom site dataset
25
+
26
+ Args:
27
+ data_dir: Root directory containing train/val folders
28
+ split: 'train' or 'val'
29
+ image_size: Size to resize images to
30
+ """
31
+ self.data_dir = data_dir
32
+ self.split = split
33
+ self.image_size = image_size
34
+
35
+ # Define class mapping
36
+ self.classes = ['bad', 'good'] # 0: bad, 1: good
37
+ self.class_to_idx = {cls: idx for idx, cls in enumerate(self.classes)}
38
+
39
+ # Load image paths and labels
40
+ self.samples = self._load_samples()
41
+
42
+ # Define transforms
43
+ self.transform = self._get_transforms()
44
+
45
+ print(f"πŸ“Š {split.upper()} Dataset loaded:")
46
+ print(f" Total samples: {len(self.samples)}")
47
+ print(f" Classes: {self.classes}")
48
+ self._print_class_distribution()
49
+
50
+ def _load_samples(self) -> List[Tuple[str, int]]:
51
+ """Load image paths and corresponding labels"""
52
+ samples = []
53
+ split_dir = os.path.join(self.data_dir, self.split)
54
+
55
+ for class_name in self.classes:
56
+ class_dir = os.path.join(split_dir, class_name)
57
+ if not os.path.exists(class_dir):
58
+ print(f"⚠️ Warning: {class_dir} not found")
59
+ continue
60
+
61
+ class_idx = self.class_to_idx[class_name]
62
+
63
+ # Load all images from class directory
64
+ for img_name in os.listdir(class_dir):
65
+ if img_name.lower().endswith(('.png', '.jpg', '.jpeg', '.bmp', '.tiff')):
66
+ img_path = os.path.join(class_dir, img_name)
67
+ samples.append((img_path, class_idx))
68
+
69
+ return samples
70
+
71
+ def _print_class_distribution(self):
72
+ """Print class distribution for the dataset"""
73
+ class_counts = Counter([label for _, label in self.samples])
74
+ for class_name, class_idx in self.class_to_idx.items():
75
+ count = class_counts.get(class_idx, 0)
76
+ print(f" {class_name}: {count} samples")
77
+
78
+ def _get_transforms(self) -> transforms.Compose:
79
+ """Get appropriate transforms for the split"""
80
+ if self.split == 'train':
81
+ return transforms.Compose([
82
+ transforms.Resize((self.image_size + 32, self.image_size + 32)),
83
+ transforms.RandomResizedCrop(self.image_size, scale=(0.8, 1.0)),
84
+ transforms.RandomHorizontalFlip(p=0.5),
85
+ transforms.RandomRotation(degrees=10),
86
+ transforms.ColorJitter(
87
+ brightness=0.2,
88
+ contrast=0.2,
89
+ saturation=0.2,
90
+ hue=0.1
91
+ ),
92
+ transforms.ToTensor(),
93
+ transforms.Normalize(
94
+ mean=[0.485, 0.456, 0.406],
95
+ std=[0.229, 0.224, 0.225]
96
+ ),
97
+ transforms.RandomErasing(p=0.1, scale=(0.02, 0.08))
98
+ ])
99
+ else:
100
+ return transforms.Compose([
101
+ transforms.Resize((self.image_size, self.image_size)),
102
+ transforms.ToTensor(),
103
+ transforms.Normalize(
104
+ mean=[0.485, 0.456, 0.406],
105
+ std=[0.229, 0.224, 0.225]
106
+ )
107
+ ])
108
+
109
+ def __len__(self) -> int:
110
+ return len(self.samples)
111
+
112
+ def __getitem__(self, idx: int) -> Tuple[torch.Tensor, int]:
113
+ """Get a sample from the dataset"""
114
+ img_path, label = self.samples[idx]
115
+
116
+ # Load image
117
+ try:
118
+ image = Image.open(img_path).convert('RGB')
119
+ except Exception as e:
120
+ print(f"⚠️ Error loading image {img_path}: {e}")
121
+ # Return a black image as fallback
122
+ image = Image.new('RGB', (self.image_size, self.image_size), color='black')
123
+
124
+ # Apply transforms
125
+ if self.transform:
126
+ image = self.transform(image)
127
+
128
+ return image, label
129
+
130
def create_data_loaders(
    data_dir: str,
    batch_size: int = 16,
    num_workers: int = 4,
    image_size: int = 224,
    use_weighted_sampling: bool = True
) -> Tuple[DataLoader, DataLoader]:
    """
    Create train and validation data loaders.

    Args:
        data_dir: Root directory containing train/val folders
        batch_size: Batch size for data loaders
        num_workers: Number of worker processes
        image_size: Size to resize images to
        use_weighted_sampling: Whether to use weighted sampling for imbalanced data

    Returns:
        Tuple of (train_loader, val_loader)
    """
    train_dataset = TelecomSiteDataset(data_dir, 'train', image_size)
    val_dataset = TelecomSiteDataset(data_dir, 'val', image_size)

    # A sampler replaces shuffling, so it is built only when requested
    # and the training set is non-empty.
    train_sampler = None
    if use_weighted_sampling and len(train_dataset) > 0:
        train_sampler = create_weighted_sampler(train_dataset)

    pin = torch.cuda.is_available()

    # drop_last keeps every training batch full (stable batch statistics);
    # shuffle is only legal when no sampler is supplied.
    train_loader = DataLoader(
        train_dataset,
        batch_size=batch_size,
        sampler=train_sampler,
        shuffle=(train_sampler is None),
        num_workers=num_workers,
        pin_memory=pin,
        drop_last=True
    )

    val_loader = DataLoader(
        val_dataset,
        batch_size=batch_size,
        shuffle=False,
        num_workers=num_workers,
        pin_memory=pin
    )

    print(f"πŸ“¦ Data loaders created:")
    print(f"   Batch size: {batch_size}")
    print(f"   Num workers: {num_workers}")
    print(f"   Train batches: {len(train_loader)}")
    print(f"   Val batches: {len(val_loader)}")
    print(f"   Weighted sampling: {use_weighted_sampling}")

    return train_loader, val_loader
186
+
187
def create_weighted_sampler(dataset: TelecomSiteDataset) -> WeightedRandomSampler:
    """
    Create weighted random sampler for imbalanced datasets.

    Each sample is weighted by the inverse frequency of its class, so
    rare classes are drawn (with replacement) about as often as common
    ones over an epoch.

    Args:
        dataset: The dataset to create sampler for

    Returns:
        WeightedRandomSampler for balanced sampling
    """
    label_counts = Counter(label for _, label in dataset.samples)
    n_samples = len(dataset.samples)
    n_classes = len(dataset.classes)

    # Inverse-frequency weight per class; .get(idx, 1) guards against a
    # division by zero for a class that has no samples.
    class_weights = {
        idx: n_samples / (n_classes * label_counts.get(idx, 1))
        for idx in range(n_classes)
    }

    # One weight per sample, looked up from its class.
    sample_weights = [class_weights[label] for _, label in dataset.samples]

    sampler = WeightedRandomSampler(
        weights=sample_weights,
        num_samples=len(sample_weights),
        replacement=True
    )

    print(f"βš–οΈ Weighted sampler created:")
    for class_name, class_idx in dataset.class_to_idx.items():
        print(f"   {class_name}: weight={class_weights[class_idx]:.3f}")

    return sampler
220
+
221
def get_inference_transform(image_size: int = 224) -> transforms.Compose:
    """
    Get transform for inference/prediction.

    Mirrors the validation pipeline: deterministic resize plus ImageNet
    normalization, no augmentation.

    Args:
        image_size: Size to resize images to

    Returns:
        Transform pipeline for inference
    """
    steps = [
        transforms.Resize((image_size, image_size)),
        transforms.ToTensor(),
        # Same ImageNet statistics used by the training/validation sets.
        transforms.Normalize(
            mean=[0.485, 0.456, 0.406],
            std=[0.229, 0.224, 0.225]
        ),
    ]
    return transforms.Compose(steps)
239
+
240
def prepare_image_for_inference(image: Image.Image, transform: transforms.Compose) -> torch.Tensor:
    """
    Prepare a PIL image for model inference.

    Args:
        image: PIL Image
        transform: Transform pipeline

    Returns:
        Preprocessed tensor with a leading batch dimension, ready for the model
    """
    # The model expects 3-channel input; normalize palette/grayscale modes.
    rgb = image if image.mode == 'RGB' else image.convert('RGB')

    # unsqueeze(0) adds the batch dimension (1, C, H, W).
    return transform(rgb).unsqueeze(0)
257
+
258
def visualize_batch(data_loader: DataLoader, num_samples: int = 8) -> None:
    """
    Visualize a batch of images from the data loader.

    Args:
        data_loader: DataLoader to sample from
        num_samples: Number of samples to visualize
    """
    try:
        import matplotlib.pyplot as plt

        batch_images, batch_labels = next(iter(data_loader))
        n = min(num_samples, len(batch_images))
        if n == 0:
            return

        # ImageNet statistics used by the dataset transforms; needed here
        # to undo normalization before display.
        mean = torch.tensor([0.485, 0.456, 0.406]).view(3, 1, 1)
        std = torch.tensor([0.229, 0.224, 0.225]).view(3, 1, 1)

        # Size the grid from n instead of hard-coding 2x4, so asking for
        # more than 8 samples no longer indexes past the axes array.
        cols = min(4, n)
        rows = (n + cols - 1) // cols
        fig, axes = plt.subplots(rows, cols, figsize=(3 * cols, 3 * rows))
        axes = np.atleast_1d(axes).flatten()

        class_names = ['Bad', 'Good']

        for i in range(n):
            # Denormalize and clamp into the displayable [0, 1] range.
            img = torch.clamp(batch_images[i] * std + mean, 0, 1)

            # (C, H, W) -> (H, W, C) for imshow.
            axes[i].imshow(img.permute(1, 2, 0).numpy())
            axes[i].set_title(f'Class: {class_names[batch_labels[i]]}')
            axes[i].axis('off')

        # Hide any leftover axes in a partially-filled final row.
        for ax in axes[n:]:
            ax.axis('off')

        plt.tight_layout()
        plt.show()

    except ImportError:
        print("⚠️ Matplotlib not available for visualization")
300
+
301
def check_data_directory(data_dir: str) -> Dict[str, Dict[str, int]]:
    """
    Check the data directory structure and count samples.

    Args:
        data_dir: Root directory to check

    Returns:
        Mapping of split name ('train'/'val') to per-class image counts,
        e.g. {'train': {'good': 10, 'bad': 8}}; empty dict if data_dir
        does not exist. (Annotation fixed: the previous Dict[str, int]
        did not match the nested dict actually returned.)
    """
    print(f"πŸ“‚ Checking data directory: {data_dir}")

    if not os.path.exists(data_dir):
        print(f"❌ Data directory not found: {data_dir}")
        return {}

    counts: Dict[str, Dict[str, int]] = {}
    image_exts = ('.png', '.jpg', '.jpeg', '.bmp', '.tiff')

    for split in ['train', 'val']:
        split_dir = os.path.join(data_dir, split)
        if not os.path.exists(split_dir):
            print(f"⚠️ {split} directory not found")
            continue

        split_counts = {}
        for class_name in ['good', 'bad']:
            class_dir = os.path.join(split_dir, class_name)
            if os.path.exists(class_dir):
                # Count only files with a recognized image extension.
                split_counts[class_name] = sum(
                    1 for f in os.listdir(class_dir)
                    if f.lower().endswith(image_exts)
                )
            else:
                split_counts[class_name] = 0

        counts[split] = split_counts
        print(f"   {split.upper()}: Good={split_counts['good']}, Bad={split_counts['bad']}")

    return counts
339
+
340
def create_sample_data_structure():
    """
    Create sample data directory structure with instructions.

    Prints and returns a usage guide describing the expected on-disk
    layout and the labeling criteria. Nothing is written to disk.
    """
    guide = """
    πŸ“ Data Directory Structure:

    data/
    β”œβ”€β”€ train/
    β”‚ β”œβ”€β”€ good/ # Place good telecom site images here
    β”‚ β”‚ β”œβ”€β”€ good_site_001.jpg
    β”‚ β”‚ β”œβ”€β”€ good_site_002.jpg
    β”‚ β”‚ └── ...
    β”‚ └── bad/ # Place bad telecom site images here
    β”‚ β”œβ”€β”€ bad_site_001.jpg
    β”‚ β”œβ”€β”€ bad_site_002.jpg
    β”‚ └── ...
    └── val/
    β”œβ”€β”€ good/ # Validation good images
    β”‚ β”œβ”€β”€ val_good_001.jpg
    β”‚ └── ...
    └── bad/ # Validation bad images
    β”œβ”€β”€ val_bad_001.jpg
    └── ...

    πŸ“‹ Data Requirements:
    - Minimum 50 images per class for training
    - 20% of data should be reserved for validation
    - Images should be clear and well-lit
    - Recommended resolution: 224x224 or higher
    - Supported formats: JPG, PNG, JPEG, BMP, TIFF

    πŸ“Š Good Site Criteria:
    - Proper cable assembly and routing
    - All cards correctly installed and labeled
    - Clean and organized equipment layout
    - Proper grounding and safety measures
    - Clear and readable labels

    πŸ“Š Bad Site Criteria:
    - Messy or improper cable routing
    - Missing or incorrectly installed cards
    - Poor equipment organization
    - Missing or unreadable labels
    - Safety issues or violations
    """

    print(guide)
    return guide
utils/model_utils.py ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Model utilities for telecom site classification
3
+ Handles ConvNeXt model loading and adaptation for transfer learning
4
+ """
5
+
6
+ import torch
7
+ import torch.nn as nn
8
+ import timm
9
+ import os
10
+ from typing import Dict, Any, Optional, Tuple
11
+
12
+ class TelecomClassifier(nn.Module):
13
+ """
14
+ ConvNeXt-based telecom site classifier
15
+ Uses transfer learning from food detection model
16
+ """
17
+
18
+ def __init__(self, num_classes: int = 2, pretrained: bool = True):
19
+ super(TelecomClassifier, self).__init__()
20
+
21
+ # Load ConvNeXt Large model (same as food detection)
22
+ self.backbone = timm.create_model(
23
+ 'convnext_large.fb_in22k_ft_in1k',
24
+ pretrained=pretrained,
25
+ num_classes=0 # Remove classification head
26
+ )
27
+
28
+ # Get feature dimensions
29
+ self.feature_dim = self.backbone.num_features
30
+
31
+ # Custom classification head for telecom sites
32
+ self.classifier = nn.Sequential(
33
+ nn.LayerNorm(self.feature_dim),
34
+ nn.Linear(self.feature_dim, 512),
35
+ nn.ReLU(inplace=True),
36
+ nn.Dropout(0.3),
37
+ nn.Linear(512, 128),
38
+ nn.ReLU(inplace=True),
39
+ nn.Dropout(0.2),
40
+ nn.Linear(128, num_classes)
41
+ )
42
+
43
+ # Initialize classifier weights
44
+ self._init_classifier_weights()
45
+
46
+ def _init_classifier_weights(self):
47
+ """Initialize classifier weights using Xavier initialization"""
48
+ for module in self.classifier.modules():
49
+ if isinstance(module, nn.Linear):
50
+ nn.init.xavier_uniform_(module.weight)
51
+ nn.init.constant_(module.bias, 0)
52
+
53
+ def forward(self, x: torch.Tensor) -> torch.Tensor:
54
+ """Forward pass through the model"""
55
+ # Extract features using ConvNeXt backbone
56
+ features = self.backbone(x)
57
+
58
+ # Classify using custom head
59
+ output = self.classifier(features)
60
+
61
+ return output
62
+
63
+ def freeze_backbone(self):
64
+ """Freeze backbone parameters for transfer learning"""
65
+ for param in self.backbone.parameters():
66
+ param.requires_grad = False
67
+ print("πŸ”’ Backbone frozen for transfer learning")
68
+
69
+ def unfreeze_backbone(self):
70
+ """Unfreeze backbone parameters for fine-tuning"""
71
+ for param in self.backbone.parameters():
72
+ param.requires_grad = True
73
+ print("πŸ”“ Backbone unfrozen for fine-tuning")
74
+
75
+ def get_parameter_count(self) -> Dict[str, int]:
76
+ """Get parameter counts for different parts of the model"""
77
+ backbone_params = sum(p.numel() for p in self.backbone.parameters())
78
+ classifier_params = sum(p.numel() for p in self.classifier.parameters())
79
+ total_params = backbone_params + classifier_params
80
+
81
+ trainable_params = sum(p.numel() for p in self.parameters() if p.requires_grad)
82
+
83
+ return {
84
+ 'backbone': backbone_params,
85
+ 'classifier': classifier_params,
86
+ 'total': total_params,
87
+ 'trainable': trainable_params
88
+ }
89
+
90
def load_food_model_weights(model: TelecomClassifier, food_model_path: str) -> TelecomClassifier:
    """
    Load weights from the pre-trained food detection model.

    Only backbone weights are transferred; the food model's classification
    head is ignored. On a missing or unreadable checkpoint, the model is
    returned unchanged (keeping its ImageNet-pretrained weights).
    """
    if not os.path.exists(food_model_path):
        print(f"⚠️ Food model not found at {food_model_path}")
        print("πŸš€ Using ImageNet pretrained weights instead")
        return model

    try:
        print(f"πŸ“‚ Loading food model weights from {food_model_path}")

        # NOTE(review): torch.load unpickles arbitrary objects — only load
        # checkpoints from trusted sources (consider weights_only=True).
        checkpoint = torch.load(food_model_path, map_location='cpu')

        # Checkpoints may be either a raw state dict or a dict wrapping one.
        if isinstance(checkpoint, dict) and 'model_state_dict' in checkpoint:
            food_state_dict = checkpoint['model_state_dict']
            accuracy = checkpoint.get('best_acc', 'Unknown')
            print(f"πŸ“Š Food model accuracy: {accuracy}%")
        else:
            food_state_dict = checkpoint

        # Re-key backbone weights to our wrapper's "backbone." prefix,
        # skipping the food model's head/classifier layers.
        backbone_state_dict = {
            f"backbone.{key}": value
            for key, value in food_state_dict.items()
            if not key.startswith('head') and not key.startswith('classifier')
        }

        # Keep only tensors whose name and shape match our architecture.
        model_dict = model.state_dict()
        filtered_dict = {
            key: value
            for key, value in backbone_state_dict.items()
            if key in model_dict and model_dict[key].shape == value.shape
        }

        model_dict.update(filtered_dict)
        model.load_state_dict(model_dict)

        print(f"βœ… Successfully loaded {len(filtered_dict)} backbone layers from food model")
        print(f"🎯 Transfer learning ready: backbone initialized with food detection weights")

        return model

    except Exception as e:
        # Best-effort by design: any failure falls back to the weights the
        # model already carries instead of aborting.
        print(f"❌ Error loading food model weights: {e}")
        print("πŸš€ Using ImageNet pretrained weights instead")
        return model
146
+
147
def create_telecom_model(
    num_classes: int = 2,
    food_model_path: Optional[str] = None,
    freeze_backbone: bool = True
) -> TelecomClassifier:
    """
    Create telecom classifier model with transfer learning from food detection.

    Args:
        num_classes: Number of output classes (2 for good/bad)
        food_model_path: Path to pre-trained food detection model
        freeze_backbone: Whether to freeze backbone for transfer learning

    Returns:
        TelecomClassifier model ready for training
    """
    print("πŸ—οΈ Creating telecom site classifier...")

    model = TelecomClassifier(num_classes=num_classes, pretrained=True)

    # Optionally seed the backbone from the food-detection checkpoint.
    if food_model_path:
        model = load_food_model_weights(model, food_model_path)

    # Frozen backbone => only the classifier head trains.
    if freeze_backbone:
        model.freeze_backbone()

    stats = model.get_parameter_count()
    print(f"πŸ“Š Model Statistics:")
    print(f"   Backbone parameters: {stats['backbone']:,}")
    print(f"   Classifier parameters: {stats['classifier']:,}")
    print(f"   Total parameters: {stats['total']:,}")
    print(f"   Trainable parameters: {stats['trainable']:,}")
    # Size estimate assumes 4 bytes per parameter (float32).
    print(f"   Model size: ~{stats['total'] * 4 / 1024**2:.1f} MB")

    return model
186
+
187
def save_model(
    model: TelecomClassifier,
    save_path: str,
    epoch: int,
    best_acc: float,
    optimizer_state: Optional[Dict] = None,
    additional_info: Optional[Dict] = None
) -> None:
    """
    Save model checkpoint with training information.

    Args:
        model: The model to save
        save_path: Path to save the model
        epoch: Current epoch number
        best_acc: Best validation accuracy achieved
        optimizer_state: Optimizer state dict
        additional_info: Additional information to save
    """
    # Descriptive metadata makes the checkpoint self-documenting.
    checkpoint = {
        'epoch': epoch,
        'model_state_dict': model.state_dict(),
        'best_acc': best_acc,
        'model_info': {
            'architecture': 'ConvNeXt Large',
            'num_classes': 2,
            'parameter_count': model.get_parameter_count(),
            'task': 'telecom_site_classification'
        }
    }

    if optimizer_state:
        checkpoint['optimizer_state_dict'] = optimizer_state

    if additional_info:
        # Merged at top level, so caller-supplied keys may overwrite the
        # defaults above.
        checkpoint.update(additional_info)

    torch.save(checkpoint, save_path)
    print(f"πŸ’Ύ Model saved to {save_path}")
226
+
227
def load_model(
    model_path: str,
    num_classes: int = 2,
    device: str = 'cpu'
) -> Tuple[TelecomClassifier, Dict[str, Any]]:
    """
    Load trained telecom classifier model.

    Args:
        model_path: Path to saved model
        num_classes: Number of output classes
        device: Device to load model on

    Returns:
        Tuple of (model, model_info); the model is in eval mode on `device`.
    """
    print(f"πŸ“‚ Loading model from {model_path}")

    # Rebuild the architecture; weights come from the checkpoint, so no
    # pretrained download is needed.
    model = TelecomClassifier(num_classes=num_classes, pretrained=False)

    # NOTE(review): torch.load unpickles arbitrary objects — only load
    # trusted checkpoints (consider weights_only=True).
    checkpoint = torch.load(model_path, map_location=device)

    model.load_state_dict(checkpoint['model_state_dict'])
    # Bug fix: the model previously stayed on CPU regardless of `device`
    # (map_location only affects checkpoint tensors); move it explicitly.
    model.to(device)
    model.eval()

    # Surface training metadata alongside the model.
    model_info = checkpoint.get('model_info', {})
    model_info['best_acc'] = checkpoint.get('best_acc', 'Unknown')
    model_info['epoch'] = checkpoint.get('epoch', 'Unknown')

    print(f"βœ… Model loaded successfully")
    print(f"   Best accuracy: {model_info.get('best_acc', 'Unknown')}")
    print(f"   Epoch: {model_info.get('epoch', 'Unknown')}")

    return model, model_info
265
+
266
def get_model_summary(model: TelecomClassifier) -> str:
    """
    Get a formatted summary of the model.

    Args:
        model: The model to summarize

    Returns:
        Formatted string with model information
    """
    counts = model.get_parameter_count()

    # Frozen parameters mean trainable < total, i.e. transfer learning.
    transfer = 'Enabled' if counts['trainable'] < counts['total'] else 'Disabled'

    # Size estimate assumes 4 bytes per parameter (float32).
    summary = f"""
    πŸ€– Telecom Site Classifier Model Summary
    {'='*50}
    Architecture: ConvNeXt Large + Custom Classifier
    Task: Binary Classification (Good/Bad Sites)

    Parameter Counts:
    Backbone (ConvNeXt): {counts['backbone']:,}
    Classifier Head: {counts['classifier']:,}
    Total Parameters: {counts['total']:,}
    Trainable Parameters: {counts['trainable']:,}

    Model Size: ~{counts['total'] * 4 / 1024**2:.1f} MB
    Transfer Learning: {transfer}
    """

    return summary