yusufbardolia committed on
Commit
9946dd2
·
verified ·
1 Parent(s): 55db5f1

Upload 9 files

Browse files
multiclass_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e9df2fa575a0d20999bffa87c6ed668352a8e7a3f141ebeeb66092280b19f6f
3
+ size 43349799
phase_1b_sample_solution_multiclass.py ADDED
@@ -0,0 +1,143 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import pandas as pd
2
+ import os
3
+ import re
4
+ import torch
5
+ import torch.nn as nn
6
+ import torch.optim as optim
7
+ from torch.utils.data import DataLoader
8
+ import timm
9
+ from sklearn.metrics import classification_report
10
+ from sklearn.model_selection import StratifiedGroupKFold
11
+ from sklearn.utils.class_weight import compute_class_weight
12
+ from submission.utils.utils import ImageData
13
+ import torchvision.transforms as transforms
14
+ import numpy as np
15
+ from tqdm import tqdm
16
+
17
# --- CONFIGURATION ---
# NOTE(review): machine-specific absolute path — will not exist on other
# machines/CI; consider an env var or CLI argument. TODO confirm intent.
BASE_PATH = "/Users/yusufbardolia/Documents/Intelligent System In Medicine/phase_1a"
PATH_TO_IMAGES = os.path.join(BASE_PATH, "images")
# Ground-truth CSV with 0-indexed multiclass labels derived from filenames.
PATH_TO_GT = os.path.join(BASE_PATH, "gt_for_classification_multiclass_from_filenames_0_index.csv")

# Split CSV is written next to the current working directory at run time.
PATH_TO_SPLIT_GT = os.path.join(os.getcwd(), "honest_split_gt.csv")
# Best checkpoint (by validation macro F1) is saved here.
MODEL_SAVE_PATH = os.path.join("submission", "multiclass_model.pth")

# --- UPGRADES ---
MODEL_NAME = 'efficientnet_b3'  # Larger, more powerful model (timm id)
IMAGE_SIZE = (300, 300)  # EfficientNet-B3 native resolution
MAX_EPOCHS = 15
BATCH_SIZE = 16  # Smaller batch for larger model
NUM_CLASSES = 3
LEARNING_RATE = 0.0003

# Prefer Apple-silicon GPU when present; otherwise fall back to CPU.
if torch.backends.mps.is_available():
    DEVICE = "mps"
    print(f"✅ Using Apple M-Series GPU (MPS)")
else:
    DEVICE = "cpu"
38
+
39
def create_honest_split():
    """Build a leakage-free, stratified train/validation split.

    An 8-digit surgery date (``202xxxxx``) is parsed out of each file name
    and used as the grouping key, so every frame from the same surgery ends
    up on the same side of the split. The first fold of a 5-fold
    StratifiedGroupKFold marks validation rows (``validation_set`` = 1) and
    the augmented CSV is written to ``PATH_TO_SPLIT_GT``.

    Returns:
        tuple: (path to the split CSV, balanced class-weight tensor computed
        on the training rows only, float32, moved to ``DEVICE``).
    """
    print("Creating honest, stratified data split...")
    frame = pd.read_csv(PATH_TO_GT)

    def _surgery_date(fname):
        # Group key: the embedded YYYYMMDD token; "unknown" when absent.
        found = re.search(r'(202\d{5})', fname)
        return found.group(1) if found else "unknown"

    groups = np.array([_surgery_date(name) for name in frame["file_name"]])
    labels = frame["category_id"].values

    splitter = StratifiedGroupKFold(n_splits=5, shuffle=True, random_state=42)
    train_rows, val_rows = next(splitter.split(frame, labels, groups=groups))

    # Persist the split so training and any re-run see identical folds.
    frame["validation_set"] = 0
    frame.loc[val_rows, "validation_set"] = 1
    frame.to_csv(PATH_TO_SPLIT_GT, index=False)

    # Class weights from the TRAINING portion only — no validation leakage.
    weights = compute_class_weight(
        class_weight='balanced',
        classes=np.unique(labels),
        y=labels[train_rows],
    )
    return PATH_TO_SPLIT_GT, torch.tensor(weights, dtype=torch.float32).to(DEVICE)
61
+
62
def main():
    """Train the multiclass classifier and save the best checkpoint.

    Pipeline: honest grouped split -> augmented/plain datasets -> timm
    EfficientNet-B3 -> AdamW + OneCycleLR training with weighted,
    label-smoothed cross-entropy -> per-epoch validation by macro F1,
    checkpointing only on improvement to MODEL_SAVE_PATH.
    """
    split_csv_path, class_weights = create_honest_split()

    # 2. Transforms (Heavy Augmentation)
    train_transforms = transforms.Compose([
        transforms.Resize((320, 320)),  # Resize larger first
        transforms.RandomCrop(IMAGE_SIZE),  # Then random crop (better data aug)
        transforms.RandomHorizontalFlip(p=0.5),
        transforms.RandomVerticalFlip(p=0.5),
        transforms.RandomRotation(degrees=45),
        transforms.ColorJitter(brightness=0.2, contrast=0.2, saturation=0.2, hue=0.1),
        transforms.ToTensor(),
        # ImageNet statistics — required to match the pretrained weights.
        transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
    ])

    # Validation: deterministic resize only, same normalization.
    val_transforms = transforms.Compose([
        transforms.Resize(IMAGE_SIZE),
        transforms.ToTensor(),
        transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
    ])

    # validation_set flag selects the CSV rows each dataset sees.
    train_dataset = ImageData(PATH_TO_IMAGES, split_csv_path, validation_set=0, transform=train_transforms)
    val_dataset = ImageData(PATH_TO_IMAGES, split_csv_path, validation_set=1, transform=val_transforms)

    # num_workers=0: single-process loading (safest with MPS on macOS).
    train_loader = DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle=True, num_workers=0)
    val_loader = DataLoader(val_dataset, batch_size=BATCH_SIZE, shuffle=False, num_workers=0)

    print(f"Loading {MODEL_NAME}...")
    model = timm.create_model(MODEL_NAME, pretrained=True, num_classes=NUM_CLASSES)
    model = model.to(DEVICE)

    # Class weights counter class imbalance; label smoothing regularizes.
    criterion = nn.CrossEntropyLoss(weight=class_weights, label_smoothing=0.1)
    optimizer = optim.AdamW(model.parameters(), lr=LEARNING_RATE, weight_decay=0.01)
    # OneCycleLR is stepped per BATCH, hence steps_per_epoch * epochs total.
    scheduler = optim.lr_scheduler.OneCycleLR(optimizer, max_lr=LEARNING_RATE, steps_per_epoch=len(train_loader), epochs=MAX_EPOCHS)

    print(f"Starting training...")
    best_f1 = 0.0

    for epoch in range(MAX_EPOCHS):
        model.train()

        pbar = tqdm(train_loader, desc=f"Epoch {epoch+1}")
        for img, label in pbar:
            img, label = img.to(DEVICE), label.to(DEVICE)

            optimizer.zero_grad()
            output = model(img)
            loss = criterion(output, label)
            loss.backward()
            optimizer.step()
            scheduler.step()  # per-batch step, required by OneCycleLR

            pbar.set_postfix({"Loss": f"{loss.item():.4f}"})

        # Validation
        model.eval()
        all_preds = []
        all_labels = []

        with torch.no_grad():
            for img, label in val_loader:
                img, label = img.to(DEVICE), label.to(DEVICE)
                output = model(img)
                preds = torch.argmax(output, dim=1).cpu().numpy()
                all_preds.extend(preds)
                all_labels.extend(label.cpu().numpy())

        # Macro F1 treats all classes equally, matching the weighted loss intent.
        report = classification_report(all_labels, all_preds, output_dict=True, zero_division=0)
        curr_f1 = report['macro avg']['f1-score']

        print(f"Val F1: {curr_f1:.4f}")

        # Checkpoint only on improvement — best weights survive later epochs.
        if curr_f1 > best_f1:
            best_f1 = curr_f1
            torch.save(model.state_dict(), MODEL_SAVE_PATH)
            print(f"🚀 Saved {MODEL_SAVE_PATH}")

    print(f"Done. Best F1: {best_f1:.4f}")
140
+
141
if __name__ == "__main__":
    # Ensure the checkpoint directory exists before training starts.
    # exist_ok=True is atomic in intent: it removes the check-then-create
    # race of `os.path.exists(...)` followed by `os.makedirs(...)`.
    os.makedirs("submission", exist_ok=True)
    main()
script.py ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import torch
3
+ import pandas as pd
4
+ import timm
5
+ from PIL import Image
6
+ from torchvision import transforms
7
+ from scipy.stats import mode
8
+ import torch.nn.functional as F
9
+
10
# CONFIG MUST MATCH TRAINING
MODEL_NAME = 'efficientnet_b3'  # timm architecture id used at train time
IMAGE_SIZE = (300, 300)  # EfficientNet-B3 native input resolution
NUM_CLASSES = 3
# Prefer Apple-silicon GPU when available, else CPU.
DEVICE = "mps" if torch.backends.mps.is_available() else "cpu"
15
+
16
def apply_temporal_smoothing(predictions, window_size=5):
    """Majority-vote smoothing over a sliding window of frame predictions.

    Each position is replaced by the mode of the ``window_size``-wide window
    centred on it; the window is truncated at the sequence boundaries. Ties
    resolve to the smallest label (scipy.stats.mode semantics). The input
    sequence is not mutated — a smoothed copy is returned.
    """
    half = window_size // 2
    total = len(predictions)
    smoothed = predictions.copy()
    for idx in range(total):
        lo = max(0, idx - half)
        hi = min(total, idx + half + 1)
        smoothed[idx] = mode(predictions[lo:hi], keepdims=False)[0]
    return smoothed
+
26
def run_inference(TEST_IMAGE_PATH, model, SUBMISSION_CSV_SAVE_PATH):
    """Predict a class per test image and write a submission CSV.

    Per image: horizontal-flip test-time augmentation (average of softmax
    probabilities over original + flipped), then argmax; the per-image
    predictions are temporally smoothed before writing ``file_name`` /
    ``category_id`` columns to SUBMISSION_CSV_SAVE_PATH.

    Args:
        TEST_IMAGE_PATH: Directory containing the test images.
        model: Classifier already on DEVICE; set to eval mode here.
        SUBMISSION_CSV_SAVE_PATH: Output CSV path.
    """
    model.eval()
    test_images = os.listdir(TEST_IMAGE_PATH)
    # Lexicographic sort — assumes filenames sort in temporal order, which
    # the smoothing below relies on. TODO confirm naming scheme guarantees this.
    test_images.sort()

    # Must mirror validation preprocessing used at training time.
    transform = transforms.Compose([
        transforms.Resize(IMAGE_SIZE),
        transforms.ToTensor(),
        transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
    ])

    raw_predictions = []
    print(f"Inference with TTA on {len(test_images)} images...")

    with torch.no_grad():
        for img_name in test_images:
            img_path = os.path.join(TEST_IMAGE_PATH, img_name)
            try:
                # Load Original
                img_pil = Image.open(img_path).convert("RGB")
                img_tensor = transform(img_pil).unsqueeze(0).to(DEVICE)

                # Load Flipped (TTA)
                img_flip = transform(img_pil.transpose(Image.FLIP_LEFT_RIGHT)).unsqueeze(0).to(DEVICE)

                # Predict both
                out1 = model(img_tensor)
                out2 = model(img_flip)

                # Average probabilities (softmax first, then mean)
                avg_out = (F.softmax(out1, dim=1) + F.softmax(out2, dim=1)) / 2

                pred = torch.argmax(avg_out, dim=1).item()
                raw_predictions.append(pred)
            except Exception as e:
                # Best-effort: an unreadable file gets class 0 rather than
                # aborting the whole submission (keeps row count aligned).
                print(f"Error {img_name}: {e}")
                raw_predictions.append(0)

    # Exploit temporal coherence of consecutive frames to remove flicker.
    final_predictions = apply_temporal_smoothing(raw_predictions, window_size=5)

    df = pd.DataFrame({"file_name": test_images, "category_id": final_predictions})
    df.to_csv(SUBMISSION_CSV_SAVE_PATH, index=False)
    print(f"Saved to {SUBMISSION_CSV_SAVE_PATH}")
69
+
70
if __name__ == "__main__":
    # Resolve model/output paths relative to this script so it works
    # regardless of the current working directory.
    current_dir = os.path.dirname(os.path.abspath(__file__))
    # NOTE(review): presumably the grader-mounted test-data path — confirm.
    TEST_PATH = "/tmp/data/test_images"
    MODEL_PATH = os.path.join(current_dir, "multiclass_model.pth")
    SUB_PATH = os.path.join(current_dir, "submission.csv")

    # Rebuild the architecture locally (no weight download) and load the
    # trained state dict onto the selected device.
    # NOTE(review): torch.load without weights_only=True unpickles arbitrary
    # objects — acceptable for our own checkpoint, but consider
    # weights_only=True on torch versions that support it.
    model = timm.create_model(MODEL_NAME, pretrained=False, num_classes=NUM_CLASSES)
    model.load_state_dict(torch.load(MODEL_PATH, map_location=DEVICE))
    model = model.to(DEVICE)

    run_inference(TEST_PATH, model, SUB_PATH)
utils/__init__.py ADDED
File without changes
utils/__pycache__/__init__.cpython-314.pyc ADDED
Binary file (198 Bytes). View file
 
utils/__pycache__/__init__.cpython-39.pyc ADDED
Binary file (171 Bytes). View file
 
utils/__pycache__/utils.cpython-314.pyc ADDED
Binary file (2.79 kB). View file
 
utils/__pycache__/utils.cpython-39.pyc ADDED
Binary file (1.27 kB). View file
 
utils/utils.py ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import pandas as pd
3
+ import numpy as np
4
+ from torch.utils.data import Dataset
5
+ from PIL import Image
6
+
7
class ImageData(Dataset):
    """Image-classification dataset driven by a split-annotated CSV.

    The annotation CSV must provide ``file_name``, ``category_id`` and a
    ``validation_set`` column (0 = training row, 1 = validation row); only
    rows matching the requested split are kept.
    """

    def __init__(self, img_dir, annotation_file, validation_set, transform=None):
        """
        Args:
            img_dir: Directory containing the image files.
            annotation_file: Path to the split CSV described above.
            validation_set: Truthy selects validation rows (== 1),
                falsy selects training rows (== 0).
            transform: Optional callable applied to each PIL image.
        """
        self.img_dir = img_dir
        self.transform = transform

        try:
            gt = pd.read_csv(annotation_file)
        except Exception as e:
            # Best-effort fallback: report the problem and expose an empty
            # dataset instead of crashing the caller during construction.
            print(f"Error reading CSV {annotation_file}: {e}")
            self.img_labels = pd.DataFrame()
            self.images = []
            self.labels = []
            return

        # One filter covers both branches: 1 -> validation, 0 -> training.
        wanted = 1 if validation_set else 0
        self.img_labels = gt[gt["validation_set"] == wanted].reset_index(drop=True)

        # Cache filenames and labels as arrays for fast indexed access.
        self.images = self.img_labels["file_name"].values
        self.labels = self.img_labels["category_id"].values

    def __len__(self):
        """Number of samples in the selected split."""
        return len(self.img_labels)

    def __getitem__(self, idx):
        """Load one sample as (transformed image, int label)."""
        img_path = os.path.join(self.img_dir, self.images[idx])

        # Force RGB so grayscale/RGBA files still yield 3 channels.
        image = Image.open(img_path).convert("RGB")

        if self.transform:
            image = self.transform(image)

        # Plain int so CrossEntropyLoss targets collate to a LongTensor.
        return image, int(self.labels[idx])