Winston de Jong committed on
Commit
0da216f
·
1 Parent(s): 1c98b00

test running model

Browse files
Files changed (1) hide show
  1. app.py +67 -18
app.py CHANGED
@@ -1,13 +1,18 @@
1
  import PIL.Image
2
  import gradio as gr
3
  import numpy as np
4
- import random
5
  import PIL
6
- import subprocess
7
- import sys
8
  import os
9
  import platform
10
  import time
 
 
 
 
 
 
 
11
 
12
  # by default, dlib will be compiled locally when installed via pip, which takes so long it
13
  # causes huggingface to time out during the build process.
@@ -20,9 +25,6 @@ start_time = time.time()
20
  import face_detection
21
  print(f"took {(time.time() - start_time) / 60} minutes to load face_recognition")
22
 
23
- # import spaces #[uncomment to use ZeroGPU]
24
- from diffusers import DiffusionPipeline
25
- import torch
26
 
27
  # # Function to display the uploaded image
28
  # def process_image(image : PIL.Image.Image):
@@ -30,23 +32,70 @@ import torch
30
  # # do AI stuff here
31
  # return gr.Image(outputs[0])
32
 
33
- def process_image_str(image : str):
34
- locations, paths = face_detection.getFaceLocationsAndFiles(image, "outputs", "imgs")
35
- # do AI stuff here
36
-
37
- return gr.Image(image)
38
-
39
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
 
41
- # Create the Gradio interface
42
  interface = gr.Interface(
43
- fn=process_image_str, # Function to process the image
44
- inputs=gr.Image(type='filepath'), # Upload input
45
- outputs=gr.Image(), # Display output
 
46
  allow_flagging='never',
47
  title="Celebrity Face Detector",
48
  description="Upload a picture of a celebrity or group of celebrities to identify them"
49
  )
50
 
 
51
  if __name__ == "__main__":
52
- interface.launch()
 
1
  import PIL.Image
2
  import gradio as gr
3
  import numpy as np
4
+
5
  import PIL
 
 
6
  import os
7
  import platform
8
  import time
9
+ from huggingface_hub import hf_hub_download
10
+ import huggingface_hub
11
+ # import spaces #[uncomment to use ZeroGPU]
12
+ from diffusers import DiffusionPipeline
13
+ import torch
14
+ from torch import nn
15
+ import torchvision
16
 
17
  # by default, dlib will be compiled locally when installed via pip, which takes so long it
18
  # causes huggingface to time out during the build process.
 
25
  import face_detection
26
  print(f"took {(time.time() - start_time) / 60} minutes to load face_recognition")
27
 
 
 
 
28
 
29
  # # Function to display the uploaded image
30
  # def process_image(image : PIL.Image.Image):
 
32
  # # do AI stuff here
33
  # return gr.Image(outputs[0])
34
 
35
+ model_repo_id = "CSSE416-final-project/faceRecogModel"
36
+ weight_file_id = "matTemp.bin"
37
+
38
+
39
# 1. Load the model from Hugging Face Hub
def load_model(repo_id, filename=weight_file_id, num_classes=100):
    """Download fine-tuned ResNet-18 weights from the HF Hub and return the model.

    Args:
        repo_id: Hugging Face Hub repository id holding the weight file.
        filename: name of the weight file inside the repo (defaults to the
            module-level ``weight_file_id``).
        num_classes: size of the final classification layer; must match the
            checkpoint. NOTE(review): assumed to be 100 celebrity classes --
            confirm against the training run.

    Returns:
        A ``torchvision`` ResNet-18 with the loaded weights, in eval mode.
    """
    # Bug fix: the original ignored the ``repo_id`` parameter and always read
    # the global ``model_repo_id`` (and the global filename) -- honor them now.
    weights_path = hf_hub_download(repo_id=repo_id, filename=filename)

    # ImageNet weights are unnecessary: the full fine-tuned state dict is
    # loaded below and overwrites every parameter anyway. ``pretrained=`` is
    # also deprecated in torchvision >= 0.13 in favor of ``weights=``.
    model = torchvision.models.resnet18(weights=None)
    num_ftrs = model.fc.in_features
    model.fc = nn.Linear(num_ftrs, num_classes)

    # Load the fine-tuned weights on CPU (default Spaces hardware has no GPU).
    state_dict = torch.load(weights_path, map_location=torch.device("cpu"))
    model.load_state_dict(state_dict)
    model.eval()  # inference only: freezes dropout/batch-norm behavior
    return model
55
+
56
+
57
# 2. Load the classifier once at import time so every request reuses it
#    instead of re-downloading the weights per call.
model = load_model(model_repo_id)


# 3. Preprocessing pipeline applied to each cropped face before inference:
#    converts a PIL image to a float tensor in [0, 1] with shape (C, H, W).
transforms = torchvision.transforms.Compose([
    torchvision.transforms.ToTensor(),
])
66
+
67
+
68
# 4. Detect, preprocess, and classify every face in the uploaded image
def process_image_str(groupImageFilePath: str):
    """Detect faces in the image at *groupImageFilePath* and classify each one.

    Returns:
        A text summary with one predicted class label per detected face
        (comma-separated), or a message when no face is found.
    """
    groupImage = PIL.Image.open(groupImageFilePath)
    locations, images = face_detection.getCroppedImages(groupImage)

    outputLabels = []
    for face in images:
        # unsqueeze adds the leading batch dimension: the model expects
        # input of shape (N, C, H, W), here N == 1.
        input_tensor = transforms(face).unsqueeze(0)

        # Inference only -- no gradient bookkeeping needed.
        with torch.no_grad():
            outputs_t = model(input_tensor)
            _, pred_t = torch.max(outputs_t, dim=1)
            outputLabels.append(pred_t.item())

    # Bug fix: the original returned ``outputLabels.pop(0)``, which raised
    # IndexError when no face was detected and silently discarded every
    # prediction after the first, despite the app advertising group support.
    if not outputLabels:
        return "No faces detected"
    return ", ".join(str(label) for label in outputLabels)
86
+
87
 
88
# 5. Build the Gradio UI: a single image upload in, the prediction text out.
interface = gr.Interface(
    fn=process_image_str,          # handler invoked per uploaded image
    inputs=gr.Image(type='filepath'),  # pass the temp-file path, not pixels
    outputs='text',                # predictions rendered as plain text
    allow_flagging='never',
    title="Celebrity Face Detector",
    description="Upload a picture of a celebrity or group of celebrities to identify them"
)

# 6. Start the server only when executed as a script, not on import.
if __name__ == "__main__":
    interface.launch()