Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -17,34 +17,39 @@ def load_model_and_mtcnn(model_path):
|
|
| 17 |
def preprocess_image(image, mtcnn, device):
|
| 18 |
processed_image = image # Initialize with the original image
|
| 19 |
try:
|
| 20 |
-
#
|
| 21 |
-
cropped_faces
|
| 22 |
if cropped_faces is not None and len(cropped_faces) > 0:
|
| 23 |
processed_image = cropped_faces[0] # Use the first detected face
|
| 24 |
-
# No else clause needed; if no faces detected, processed_image remains the original
|
| 25 |
except Exception as e:
|
| 26 |
st.write(f"Exception in face detection: {e}")
|
| 27 |
processed_image = image
|
| 28 |
|
| 29 |
transform = transforms.Compose([
|
| 30 |
-
transforms.Resize((224, 224)),
|
| 31 |
transforms.ToTensor(),
|
| 32 |
transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
|
| 33 |
])
|
| 34 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 35 |
image_tensor = image_tensor.unsqueeze(0) # Add a batch dimension
|
| 36 |
-
return image_tensor,
|
| 37 |
|
| 38 |
# Function for inference
|
| 39 |
def predict(image_tensor, model, device):
|
| 40 |
model.eval()
|
| 41 |
with torch.no_grad():
|
| 42 |
outputs = model(image_tensor)
|
|
|
|
| 43 |
probabilities = torch.nn.functional.softmax(outputs.logits, dim=1)
|
| 44 |
predicted_class = torch.argmax(probabilities, dim=1)
|
| 45 |
return predicted_class, probabilities
|
| 46 |
|
| 47 |
-
# Streamlit UI
|
| 48 |
st.title("Face Detection and Classification with ViT")
|
| 49 |
st.write("Upload an image, and the model will detect faces and classify the image.")
|
| 50 |
|
|
@@ -58,6 +63,7 @@ if uploaded_file is not None:
|
|
| 58 |
image_tensor, final_image = preprocess_image(image, mtcnn, device)
|
| 59 |
predicted_class, probabilities = predict(image_tensor, model, device)
|
| 60 |
|
|
|
|
| 61 |
st.write(f"Predicted class: {predicted_class.item()}")
|
| 62 |
# Display the final processed image
|
| 63 |
st.image(final_image, caption='Processed Image', use_column_width=True)
|
|
|
|
def preprocess_image(image, mtcnn, device):
    """Detect a face in *image*, crop to it, and build a normalized model input.

    Parameters:
        image: the uploaded image (a PIL.Image — TODO confirm at the caller).
        mtcnn: face detector; called as ``mtcnn(image)`` and expected to return
            cropped face tensor(s), or ``None`` when no face is found.
        device: torch device the resulting tensor is moved to.

    Returns:
        (image_tensor, processed_image_pil): a ``(1, 3, 224, 224)`` normalized
        tensor ready for the model, and the PIL image that was actually
        transformed (first detected face, or the original image as a fallback).
    """
    processed_image = image  # Fall back to the original image
    try:
        # Directly call mtcnn with the image to get cropped faces
        cropped_faces = mtcnn(image)
        if cropped_faces is not None and len(cropped_faces) > 0:
            processed_image = cropped_faces[0]  # Use the first detected face
    except Exception as e:
        # Best-effort: surface the failure in the UI and classify the full image.
        st.write(f"Exception in face detection: {e}")
        processed_image = image

    transform = transforms.Compose([
        transforms.Resize((224, 224)),
        transforms.ToTensor(),
        # ImageNet statistics, the usual normalization for ViT backbones.
        transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
    ])

    # Ensure processed_image is a PIL Image for the transformation.
    if not isinstance(processed_image, Image.Image):
        # BUG FIX: MTCNN crops are channel-first (C, H, W) float tensors, but
        # Image.fromarray(..., 'RGB') requires (H, W, 3) uint8 — the original
        # raw astype('uint8') on a CHW float tensor raised or garbled the image.
        face = processed_image.detach().cpu()
        if face.ndim == 3 and face.shape[0] == 3:
            face = face.permute(1, 2, 0)  # CHW -> HWC for PIL
        arr = face.numpy()
        if arr.dtype != 'uint8':
            # Min-max rescale normalized floats into displayable 0-255 range.
            lo, hi = float(arr.min()), float(arr.max())
            scale = 255.0 / (hi - lo) if hi > lo else 1.0
            arr = ((arr - lo) * scale).astype('uint8')
        processed_image_pil = Image.fromarray(arr, 'RGB')
    else:
        processed_image_pil = processed_image

    image_tensor = transform(processed_image_pil).to(device)
    image_tensor = image_tensor.unsqueeze(0)  # Add a batch dimension
    return image_tensor, processed_image_pil
# Function for inference
def predict(image_tensor, model, device):
    """Run one forward pass and return (predicted_class, probabilities).

    ``model`` is switched to eval mode and called without gradient tracking.
    NOTE: assumes the model output exposes a ``logits`` attribute — adjust
    for your model's output if it does not.
    """
    model.eval()  # disable dropout / batch-norm updates for inference
    with torch.no_grad():
        outputs = model(image_tensor)
        # Adjust for your model's output if it does not have a 'logits' attribute
        logits = outputs.logits
        probabilities = torch.nn.functional.softmax(logits, dim=1)
        predicted_class = probabilities.argmax(dim=1)
        return predicted_class, probabilities
# Streamlit UI setup
# Page title and one-line usage instruction shown above the uploader.
st.title("Face Detection and Classification with ViT")
st.write("Upload an image, and the model will detect faces and classify the image.")
# NOTE(review): these statements run inside the `if uploaded_file is not None:`
# guard (per the surrounding diff hunk header); `image`, `mtcnn`, `model` and
# `device` are defined by the elided upload/model-loading lines — confirm there.
image_tensor, final_image = preprocess_image(image, mtcnn, device)
predicted_class, probabilities = predict(image_tensor, model, device)

# Here, customize the display of predicted_class and probabilities based on your model's specifics
st.write(f"Predicted class: {predicted_class.item()}")
# Display the final processed image
st.image(final_image, caption='Processed Image', use_column_width=True)