Spaces:

Sairii
/

FoodVision__Mini

Build error

App Files Files Community

Sairii committed on May 29, 2025

Commit

ce714e8

verified ·

1 Parent(s): aafc84f

Upload 8 files

Browse files

Files changed (8) hide show

09-foodvision-mini-inference-speed-vs-performance.png +0 -0
app.py +79 -0
examples/2582289.jpg +0 -0
examples/3622237.jpg +0 -0
examples/592799.jpg +0 -0
helper_functions.py +294 -0
model.py +42 -0
requirements.txt +4 -0

09-foodvision-mini-inference-speed-vs-performance.png ADDED Viewed

app.py ADDED Viewed

	@@ -0,0 +1,79 @@

+### 1. Import and class names setup ###
+import gradio as gr
+import os
+import torch
+from model import create_effnet_b2_model
+from timeit import default_timer as timer
+from typing import Tuple, Dict
+# Setup class names; predict() labels model output index i with class_names[i]
+class_names = ["pizza", "steak", "sushi"]
+### 2. Model and transforms preparation ###
+# Build the EffNetB2 model with one output per class, plus its image transforms
+effnet_b2, effnet_b2_transforms = create_effnet_b2_model(
+    num_classes=len(class_names))
+# Load the saved weights onto the CPU.
+# weights_only=True limits unpickling to tensors and plain containers, which is
+# all a state_dict needs, so a tampered checkpoint cannot run code while loading.
+effnet_b2.load_state_dict(
+    torch.load("09_pretrained_effnetb2_feature_extractor_steak_sushi_20_percent.pth",
+               map_location=torch.device("cpu"),
+               weights_only=True)
+)
+### 3. Predict function ###
+def predict(img) -> Tuple[Dict, float]:
+  """Classifies one image with EffNetB2 and times the prediction.
+  Args:
+    img: input image; the Gradio interface in this file supplies a PIL image.
+  Returns:
+    A tuple of (dict mapping each class name to its predicted probability,
+    elapsed prediction time in seconds rounded to 4 decimal places).
+  """
+  tic = timer()
+  # Apply the EffNetB2 transforms, then add a leading batch dimension
+  batch = effnet_b2_transforms(img).unsqueeze(0)
+  # Eval mode + inference mode: no training behaviour, no gradient tracking
+  effnet_b2.eval()
+  with torch.inference_mode():
+    logits = effnet_b2(batch)
+    # Softmax over the class dimension turns logits into probabilities
+    probs = torch.softmax(logits, dim=1)
+  # Pair every class name with the probability at the same output index
+  pred_labels_and_probs = {
+      name: float(probs[0][idx]) for idx, name in enumerate(class_names)
+  }
+  toc = timer()
+  elapsed = round(toc - tic, 4)
+  return pred_labels_and_probs, elapsed
+### 4. Gradio app ###
+# Create title, description and article
+title = "FoodVision Mini 🍕🥩🍣"
+description = " An [EffNetB2 feature extractor](https://docs.pytorch.org/vision/0.21/models/generated/torchvision.models.efficientnet_b2.html#efficientnet-b2) computer vision model to classify images as pizza, steak or sushi"
+article = "Created at [09. PyTorch Model Deployment](https://www.learnpytorch.io/09_pytorch_model_deployment/)"
+# Create example list: one single-item list per file in examples/, because the
+# interface has exactly one input component
+example_list = [["examples/" + example] for example in os.listdir("examples")]
+# Create the Gradio demo
+demo = gr.Interface(
+    fn=predict,  # function called with the uploaded image
+    inputs=gr.Image(type="pil"),  # hand predict() a PIL image
+    outputs=[
+        gr.Label(num_top_classes=3, label="Predictions"),
+        gr.Number(label="Prediction time (s)")],
+    examples=example_list,
+    title=title,
+    description=description,
+    article=article
+)
+# Launch the demo. share=True is intentionally not passed: this app is hosted on
+# Hugging Face Spaces, which already serves it publicly, so a share link is
+# redundant there.
+demo.launch(debug=False)

examples/2582289.jpg ADDED Viewed

examples/3622237.jpg ADDED Viewed

examples/592799.jpg ADDED Viewed

helper_functions.py ADDED Viewed

	@@ -0,0 +1,294 @@

+"""
+A series of helper functions used throughout the course.
+If a function gets defined once and could be used over and over, it'll go in here.
+"""
+import torch
+import matplotlib.pyplot as plt
+import numpy as np
+from torch import nn
+import os
+import zipfile
+from pathlib import Path
+import requests
+# Walk through an image classification directory and find out how many files (images)
+# are in each subdirectory.
+import os
+def walk_through_dir(dir_path):
+    """
+    Prints a summary line for dir_path and every directory beneath it.
+    Args:
+    dir_path (str): target directory
+    Returns:
+    None. For each directory visited by os.walk, one line is printed with:
+      number of subdirectories it contains
+      number of files (reported as images) it contains
+      the path of that directory
+    """
+    for current_dir, subdirs, files in os.walk(dir_path):
+        n_dirs, n_files = len(subdirs), len(files)
+        print(f"There are {n_dirs} directories and {n_files} images in '{current_dir}'.")
+def plot_decision_boundary(model: torch.nn.Module, X: torch.Tensor, y: torch.Tensor):
+    """Draws the model's decision regions over a grid, with the points of X coloured by y.
+    Only the first two feature columns of X are used for the grid and the scatter.
+    Source - https://madewithml.com/courses/foundations/neural-networks/ (with modifications)
+    """
+    # NumPy and Matplotlib work on CPU data, so move the model and tensors there
+    model.to("cpu")
+    X, y = X.to("cpu"), y.to("cpu")
+    # Build a 101 x 101 grid that extends 0.1 beyond the data on every side
+    margin = 0.1
+    first_col, second_col = X[:, 0], X[:, 1]
+    x_axis = np.linspace(first_col.min() - margin, first_col.max() + margin, 101)
+    y_axis = np.linspace(second_col.min() - margin, second_col.max() + margin, 101)
+    xx, yy = np.meshgrid(x_axis, y_axis)
+    # Flatten the grid into (x, y) rows the model can predict on
+    grid_points = np.column_stack((xx.ravel(), yy.ravel()))
+    X_to_pred_on = torch.from_numpy(grid_points).float()
+    # Predict without gradient tracking
+    model.eval()
+    with torch.inference_mode():
+        y_logits = model(X_to_pred_on)
+    # More than two distinct labels -> multi-class (softmax + argmax), else binary (sigmoid + round)
+    is_multiclass = len(torch.unique(y)) > 2
+    if is_multiclass:
+        y_pred = torch.softmax(y_logits, dim=1).argmax(dim=1)
+    else:
+        y_pred = torch.round(torch.sigmoid(y_logits))
+    # Give the predictions the grid's shape so they can be drawn as filled contours
+    y_pred = y_pred.reshape(xx.shape).detach().numpy()
+    colour_map = plt.cm.RdYlBu
+    plt.contourf(xx, yy, y_pred, cmap=colour_map, alpha=0.7)
+    plt.scatter(X[:, 0], X[:, 1], c=y, s=40, cmap=colour_map)
+    plt.xlim(xx.min(), xx.max())
+    plt.ylim(yy.min(), yy.max())
+# Scatter-plot training data, test data and (optionally) predictions
+def plot_predictions(
+    train_data, train_labels, test_data, test_labels, predictions=None
+):
+    """
+  Plots training data (blue) and test data (green) on one figure and, when
+  predictions are given, overlays them in red against the test data.
+  """
+    plt.figure(figsize=(10, 7))
+    # Each entry: (x values, y values, colour, legend label)
+    series = [
+        (train_data, train_labels, "b", "Training data"),
+        (test_data, test_labels, "g", "Testing data"),
+    ]
+    if predictions is not None:
+        # Predictions are drawn at the test inputs
+        series.append((test_data, predictions, "r", "Predictions"))
+    for xs, ys, colour, label in series:
+        plt.scatter(xs, ys, c=colour, s=4, label=label)
+    # Show the legend
+    plt.legend(prop={"size": 14})
+# Accuracy: percentage of predictions that equal their truth label
+def accuracy_fn(y_true, y_pred):
+    """Returns the percentage of predictions that match the truth labels.
+    Args:
+        y_true (torch.Tensor): Truth labels.
+        y_pred (torch.Tensor): Predictions to be compared to the truth labels.
+    Returns:
+        float: Accuracy as a percentage of len(y_pred), e.g. 78.45
+    """
+    # Element-wise equality, then count the matches as a plain Python number
+    n_correct = torch.eq(y_true, y_pred).sum().item()
+    n_total = len(y_pred)
+    return (n_correct / n_total) * 100
+def print_train_time(start, end, device=None):
+    """Prints and returns the elapsed time between start and end.
+    Args:
+        start (float): Start time of computation (preferred in timeit format).
+        end (float): End time of computation.
+        device ([type], optional): Device named in the printed message. Defaults to None.
+    Returns:
+        float: end - start, i.e. the elapsed time in seconds.
+    """
+    total_time = end - start
+    # Report the duration with millisecond precision
+    message = f"\nTrain time on {device}: {total_time:.3f} seconds"
+    print(message)
+    return total_time
+# Draw the loss and accuracy curves of a model side by side
+def plot_loss_curves(results):
+    """Plots train/test loss and train/test accuracy from a results dictionary.
+    Args:
+        results (dict): dictionary containing list of values, e.g.
+            {"train_loss": [...],
+             "train_acc": [...],
+             "test_loss": [...],
+             "test_acc": [...]}
+    """
+    # Read all four series up front so a missing key fails before any figure is created
+    train_loss, test_loss = results["train_loss"], results["test_loss"]
+    train_acc, test_acc = results["train_acc"], results["test_acc"]
+    # One x position per recorded training-loss value
+    epochs = range(len(results["train_loss"]))
+    plt.figure(figsize=(15, 7))
+    # Each panel: (title, (values, legend label) for the train curve, same for the test curve)
+    panels = [
+        ("Loss", (train_loss, "train_loss"), (test_loss, "test_loss")),
+        ("Accuracy", (train_acc, "train_accuracy"), (test_acc, "test_accuracy")),
+    ]
+    for position, (heading, *curves) in enumerate(panels, start=1):
+        plt.subplot(1, 2, position)
+        for values, label in curves:
+            plt.plot(epochs, values, label=label)
+        plt.title(heading)
+        plt.xlabel("Epochs")
+        plt.legend()
+# Pred and plot image function from notebook 04
+# See creation: https://www.learnpytorch.io/04_pytorch_custom_datasets/#113-putting-custom-image-prediction-together-building-a-function
+from typing import List
+import torchvision
+def pred_and_plot_image(
+    model: torch.nn.Module,
+    image_path: str,
+    class_names: List[str] = None,
+    transform=None,
+    device: torch.device = "cuda" if torch.cuda.is_available() else "cpu",
+):
+    """Predicts the class of one image file with a trained model and plots the result.
+    Args:
+        model (torch.nn.Module): trained PyTorch image classification model.
+        image_path (str): filepath to target image.
+        class_names (List[str], optional): class names indexed by predicted label. Defaults to None,
+            in which case the raw predicted label is shown in the title.
+        transform (_type_, optional): transform applied to the scaled image tensor. Defaults to None.
+        device (torch.device, optional): target device to compute on. Defaults to "cuda" if torch.cuda.is_available() else "cpu".
+    Returns:
+        None. Draws the image on the current Matplotlib axes with the prediction as title.
+    Example usage:
+        pred_and_plot_image(model=model,
+                            image_path="some_image.jpeg",
+                            class_names=["class_1", "class_2", "class_3"],
+                            transform=torchvision.transforms.ToTensor(),
+                            device=device)
+    """
+    # Read the file into a tensor, cast to float32 and divide by 255 to scale the pixel values
+    raw_pixels = torchvision.io.read_image(str(image_path))
+    target_image = raw_pixels.type(torch.float32) / 255.0
+    if transform:
+        target_image = transform(target_image)
+    # Model and input must live on the same device
+    model.to(device)
+    model.eval()
+    with torch.inference_mode():
+        # The model is called on a batch, so add a leading dimension of size 1
+        target_image = target_image.unsqueeze(dim=0)
+        logits = model(target_image.to(device))
+    # Logits -> probabilities -> index of the most likely class
+    pred_probs = torch.softmax(logits, dim=1)
+    pred_label = torch.argmax(pred_probs, dim=1)
+    # Drop the batch dimension and reorder dims to (1, 2, 0) for Matplotlib
+    plt.imshow(target_image.squeeze().permute(1, 2, 0))
+    top_prob = pred_probs.max().cpu()
+    # Show the class name when names were supplied, otherwise the raw label tensor
+    shown_label = class_names[pred_label.cpu()] if class_names else pred_label
+    plt.title(f"Pred: {shown_label} | Prob: {top_prob:.3f}")
+    plt.axis(False)
+def set_seeds(seed: int=42):
+    """Sets random seeds for torch operations.
+    Args:
+        seed (int, optional): Random seed to set. Defaults to 42.
+    """
+    # First the general torch seed, then the seed for CUDA (GPU) operations
+    for seed_fn in (torch.manual_seed, torch.cuda.manual_seed):
+        seed_fn(seed)
+def download_data(source: str,
+                  destination: str,
+                  remove_source: bool = True) -> Path:
+    """Downloads a zipped dataset from source and unzips to data/<destination>.
+    Args:
+        source (str): A link to a zipped file containing data.
+        destination (str): Name of the directory under data/ to unzip into.
+        remove_source (bool): Whether to remove the downloaded zip file afterwards.
+    Returns:
+        pathlib.Path to downloaded data.
+    Raises:
+        requests.HTTPError: if the server answers with an error status.
+        zipfile.BadZipFile: if the downloaded file is not a valid zip archive.
+    Example usage:
+        download_data(source="https://github.com/mrdbourke/pytorch-deep-learning/raw/main/data/pizza_steak_sushi.zip",
+                      destination="pizza_steak_sushi")
+    """
+    # Setup path to data folder
+    data_path = Path("data/")
+    image_path = data_path / destination
+    # An existing directory is treated as "already downloaded"
+    if image_path.is_dir():
+        print(f"[INFO] {image_path} directory exists, skipping download.")
+        return image_path
+    print(f"[INFO] Did not find {image_path} directory, creating one...")
+    target_file = Path(source).name
+    zip_path = data_path / target_file
+    # Download before touching the disk and fail on HTTP errors: creating the
+    # directory first would leave it behind when the download fails, and the
+    # next call would then wrongly skip the download.
+    print(f"[INFO] Downloading {target_file} from {source}...")
+    response = requests.get(source, timeout=60)
+    response.raise_for_status()
+    data_path.mkdir(parents=True, exist_ok=True)
+    zip_path.write_bytes(response.content)
+    try:
+        # Opening the archive validates it, so the target directory is only
+        # created once the download is known to be a readable zip file
+        with zipfile.ZipFile(zip_path, "r") as zip_ref:
+            print(f"[INFO] Unzipping {target_file} data...")
+            image_path.mkdir(parents=True, exist_ok=True)
+            zip_ref.extractall(image_path)
+    finally:
+        # Remove .zip file, also when unzipping failed
+        if remove_source:
+            os.remove(zip_path)
+    return image_path

model.py ADDED Viewed

	@@ -0,0 +1,42 @@

+import torch
+import torchvision
+from torch import nn
+def create_effnet_b2_model(num_classes: int = 3,
+                           seed: int = 42):
+  """
+  Builds a frozen EfficientNetB2 feature extractor with a new classifier head,
+  together with the transforms that belong to its pretrained weights.
+    Args:
+        num_classes (int, optional): number of classes in the classifier head.
+            Defaults to 3.
+        seed (int, optional): random seed set before the head is created.
+            Defaults to 42.
+    Returns:
+        model (torch.nn.Module): EffNetB2 feature extractor model.
+        transforms (torchvision.transforms): EffNetB2 image transforms.
+  """
+  # Pretrained weights define both the model parameters and the matching transforms
+  weights = torchvision.models.EfficientNet_B2_Weights.DEFAULT
+  model = torchvision.models.efficientnet_b2(weights=weights)
+  transforms = weights.transforms()
+  # Freeze every pretrained parameter; the head created below stays trainable
+  model.requires_grad_(False)
+  # Seed first so the new head's initial weights are reproducible
+  torch.manual_seed(seed)
+  dropout = nn.Dropout(p=0.3, inplace=True)
+  head = nn.Linear(in_features=1408, out_features=num_classes)
+  model.classifier = nn.Sequential(dropout, head)
+  return model, transforms

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+torch >= 2.0.0
+torchvision >= 0.15.0
+gradio >= 4.0.0