Spaces:

halictus
/

honey-bee-identification

Sleeping

File size: 8,351 Bytes

from fastapi import FastAPI, UploadFile, File, HTTPException
from pydantic import BaseModel
import uvicorn
import io
import logging
import datetime
import re
import os
import requests
import pandas as pd
from PIL import Image
from autogluon.multimodal import MultiModalPredictor
from huggingface_hub import snapshot_download

###############################################################################
# Logging configuration (optional)
###############################################################################
log_filename = "model_predictions.log"
logging.basicConfig(
    filename=log_filename, 
    level=logging.INFO, 
    format='%(asctime)s - %(message)s'
)

###############################################################################
# Model loading
###############################################################################
def load_model():
    """
    Downloads the model from the specified huggingface hub repo and 
    loads it using MultiModalPredictor.
    """
    repo_id = "Honey-Bee-Society/honeybee_ml_v1"
    local_dir = snapshot_download(repo_id)

    assets_path = os.path.join(local_dir, "assets.json")
    model_checkpoint = os.path.join(local_dir, "model.ckpt")

    if not os.path.exists(assets_path) or not os.path.exists(model_checkpoint):
        raise FileNotFoundError("Required model files not found in the downloaded directory.")

    predictor = MultiModalPredictor.load(local_dir)
    return predictor

###############################################################################
# Image processing and prediction routines
###############################################################################
def resize_image_proportionally(image, max_size_mb=1):
    """
    If the in-memory size of the image is > max_size_mb, 
    resize it proportionally.
    """
    img_byte_array = io.BytesIO()
    image.save(img_byte_array, format='PNG')
    img_size = len(img_byte_array.getvalue()) / (1024 * 1024)

    if img_size > max_size_mb:
        scale_factor = (max_size_mb / img_size) ** 0.5
        new_width = int(image.width * scale_factor)
        new_height = int(image.height * scale_factor)
        image = image.resize((new_width, new_height))

    return image


def predict_image(image: Image.Image, predictor: MultiModalPredictor):
    """
    Run the prediction via the AutoGluon MultiModalPredictor. 
    Returns probability dataframe for each class.
    """
    img_byte_array = io.BytesIO()
    image.save(img_byte_array, format='PNG')
    img_data = img_byte_array.getvalue()
    df = pd.DataFrame({"image": [img_data]})
    probabilities = predictor.predict_proba(df, realtime=True)
    return probabilities


def determine_label(probabilities):
    """
    Given the probabilities DataFrame, compute the final label.
    Returns a dict with numeric scores and a text label.
    """
    honeybee_score = float(probabilities[1].iloc[0]) * 100
    bumblebee_score = float(probabilities[2].iloc[0]) * 100
    vespidae_score = float(probabilities[3].iloc[0]) * 100

    highest_score = max(honeybee_score, bumblebee_score, vespidae_score)
    if highest_score < 80:
        prediction_label = "No bee detected (scores too low)."
    else:
        if honeybee_score == highest_score:
            prediction_label = "Honey Bee"
        elif bumblebee_score == highest_score:
            prediction_label = "Bumblebee"
        else:
            prediction_label = "Vespidae (wasp/hornet)"

    return {
        "honeybee_score": honeybee_score,
        "bumblebee_score": bumblebee_score,
        "vespidae_score": vespidae_score,
        "prediction_label": prediction_label
    }


def log_predictions(honeybee_score, bumblebee_score, vespidae_score, source_info):
    """
    Log predictions to a file (optional).
    """
    logging.info(
        f"Source: {source_info}, "
        f"Honeybee: {honeybee_score:.2f}%, "
        f"Bumblebee: {bumblebee_score:.2f}%, "
        f"Vespidae: {vespidae_score:.2f}%"
    )

###############################################################################
# Request models
###############################################################################
class ImageUrlRequest(BaseModel):
    image_url: str

###############################################################################
# FastAPI app and endpoints
###############################################################################
app = FastAPI(title="Honey Bee Classification API")

# Load the model at startup (only once).
predictor = load_model()

@app.get("/ping")
def ping():
    """
    A simple endpoint to check if the API is running.
    """
    return {"message": "pong"}

@app.post("/predict")
async def predict_endpoint(
    image_url_req: ImageUrlRequest = None,
    file: UploadFile = File(None)
):
    """
    Accepts either a JSON body with `image_url` or a multipart form-data `file`.
    Returns JSON with honeybee, bumblebee, vespidae scores, and a predicted label.
    """
    # 1) If user provided an image URL
    if image_url_req and image_url_req.image_url:
        image_url = image_url_req.image_url
        # Download the image
        try:
            response = requests.get(
                image_url, 
                headers={"User-Agent": "HoneyBeeClassification/1.0 (+https://example.com)"}
            )
            if response.status_code != 200:
                raise HTTPException(
                    status_code=400, 
                    detail=f"Failed to retrieve image from {image_url}. HTTP {response.status_code}"
                )
        except Exception as e:
            raise HTTPException(
                status_code=400, 
                detail=f"Error downloading image from {image_url}: {e}"
            )
        
        image_bytes = response.content
        image_size_mb = len(image_bytes) / (1024*1024)
        if image_size_mb > 10:
            raise HTTPException(
                status_code=413,
                detail=f"Image size {image_size_mb:.2f}MB exceeds 10MB limit."
            )
        # Convert to PIL Image
        try:
            image = Image.open(io.BytesIO(image_bytes))
        except Exception as e:
            raise HTTPException(
                status_code=400, 
                detail=f"Could not open image: {e}"
            )
        
        # 2) If user instead provided a file
    elif file is not None:
        # Check file size
        file_size = 0
        file.file.seek(0, 2)  # move to end
        file_size = file.file.tell()
        file.file.seek(0)     # reset pointer
        mb_size = file_size / (1024 * 1024)
        if mb_size > 10:
            raise HTTPException(
                status_code=413,
                detail=f"Uploaded file size {mb_size:.2f}MB exceeds 10MB limit."
            )
        
        # Convert to PIL Image
        try:
            contents = await file.read()
            image = Image.open(io.BytesIO(contents))
        except Exception as e:
            raise HTTPException(
                status_code=400, 
                detail=f"Could not open uploaded image: {e}"
            )
        source_info = f"uploaded_file:{file.filename}"
    else:
        raise HTTPException(
            status_code=400, 
            detail="No image provided. Supply either `image_url` or `file`."
        )

    # Resize the image if needed
    image = resize_image_proportionally(image)

    # Predict
    try:
        probabilities = predict_image(image, predictor)
        results = determine_label(probabilities)
    except Exception as e:
        raise HTTPException(
            status_code=500,
            detail=f"Prediction failed: {e}"
        )

    # Optionally log predictions
    source_name = image_url_req.image_url if (image_url_req and image_url_req.image_url) else file.filename
    log_predictions(
        results["honeybee_score"],
        results["bumblebee_score"],
        results["vespidae_score"],
        source_info=source_name
    )

    return results


# If running locally, uncomment to start the server via `python app.py`
# (On Hugging Face Spaces, a separate command may be used.)
# if __name__ == "__main__":
#     uvicorn.run(app, host="0.0.0.0", port=7860)
if __name__ == "__main__":
    import uvicorn
    import os

    port = int(os.environ.get("PORT", 7860))
    uvicorn.run(app, host="0.0.0.0", port=port)