Spaces:

halictus
/

bee_ml_1

Sleeping

App Files Community

JackRabbit committed on Feb 2, 2025

Commit

b644be2

1 Parent(s): 2995c7a

api updates

Browse files

Files changed (1) hide show

app.py +39 -75

app.py CHANGED Viewed

@@ -14,34 +14,23 @@ import re
 log_filename = "model_predictions.log"
 logging.basicConfig(filename=log_filename, level=logging.INFO, format='%(asctime)s - %(message)s')
-# Set the page to wide mode
-st.set_page_config(page_title="Honey Bee Image Classification")
-# -------------------------
-# MODEL LOADING
-# -------------------------
 @st.cache_resource
 def load_model():
     repo_id = "Honey-Bee-Society/honeybee_ml_v1"
-    # Download the model files from Hugging Face
     local_dir = snapshot_download(repo_id)
-    # Ensure the necessary files exist in the local directory
     assets_path = os.path.join(local_dir, "assets.json")
     model_checkpoint = os.path.join(local_dir, "model.ckpt")
     if not os.path.exists(assets_path) or not os.path.exists(model_checkpoint):
         raise FileNotFoundError("Required model files not found in the downloaded directory.")
-    # Load the model using the downloaded directory path
     return MultiModalPredictor.load(local_dir)
-# -------------------------
-# HELPER FUNCTIONS
-# -------------------------
 def resize_image_proportionally(image, max_size_mb=1):
-    """Resize the image if it exceeds max_size_mb in memory."""
     img_byte_array = io.BytesIO()
     image.save(img_byte_array, format='PNG')
     img_size = len(img_byte_array.getvalue()) / (1024 * 1024)
@@ -55,7 +44,6 @@ def resize_image_proportionally(image, max_size_mb=1):
     return image
 def predict_image(image, predictor):
-    """Predict probabilities for an in-memory PIL image using the given predictor."""
     img_byte_array = io.BytesIO()
     image.save(img_byte_array, format='PNG')
     img_data = img_byte_array.getvalue()
@@ -64,23 +52,19 @@ def predict_image(image, predictor):
     return probabilities
 def save_image(image, img_name, target_size_kb=500):
-    """Compress and save the image to ensure it is <= target_size_kb KB."""
     processed_image_path = os.path.join("processed_images", img_name)
     if not os.path.exists("processed_images"):
         os.makedirs("processed_images")
-    quality = 95  # Start with high quality
     img_byte_array = io.BytesIO()
-    while quality > 10:  # Stop if quality gets too low
         img_byte_array.seek(0)
         image.save(img_byte_array, format='JPEG', quality=quality)
         img_size_kb = len(img_byte_array.getvalue()) / 1024
         if img_size_kb <= target_size_kb:
             break
         quality -= 5
     with open(processed_image_path, "wb") as f:
@@ -97,12 +81,10 @@ def log_predictions(image_path, honeybee_score, bumblebee_score, vespidae_score)
     )
 def sanitize_filename(filename):
-    """Remove unsafe characters from filenames."""
     safe_filename = re.sub(r'[^A-Za-z0-9_.-]', '_', filename)
     return safe_filename
 def check_file_size(uploaded_file, max_size_mb=10):
-    """Return False if file size exceeds `max_size_mb`."""
     uploaded_file.seek(0, os.SEEK_END)
     file_size = uploaded_file.tell() / (1024 * 1024)
     uploaded_file.seek(0)
@@ -111,27 +93,28 @@ def check_file_size(uploaded_file, max_size_mb=10):
         return False
     return True
-# -------------------------
-# API HANDLER
-# -------------------------
 def run_api(predictor):
     """
-    A simple 'API-like' endpoint in Streamlit.
-    Usage example:
-    ?api=1&image_url=https://somewhere.com/bee.jpg
     """
-    params = st.query_params  # Replaced st.experimental_get_query_params with st.query_params
-    # image_url = params.get("image_url", )
-    image_url = params.get("image_url")
-    st.write("DEBUG: We are inside run_api()!")
-    st.write("DEBUG: st.query_params:", params)
     if not image_url:
-        st.json({"error": "No 'image_url' provided. Example: ?api=1&image_url=<URL>"})
-        return
     # Download the image
     response = requests.get(
@@ -141,23 +124,23 @@ def run_api(predictor):
     if response.status_code != 200:
         st.json({"error": f"Failed to retrieve image from {image_url}. HTTP {response.status_code}"})
-        return
     image_bytes = response.content
-    # Check file size (limit 10MB as in the UI)
     image_size_mb = len(image_bytes)/(1024*1024)
     if image_size_mb > 10:
         st.json({"error": f"Image size {image_size_mb:.2f}MB exceeds 10MB limit."})
-        return
-    # Convert to PIL for processing
     try:
         image = Image.open(io.BytesIO(image_bytes))
     except Exception as e:
         st.json({"error": f"Could not open image: {e}"})
-        return
-    # Optional: resize to keep memory usage low (same logic as UI)
     image = resize_image_proportionally(image)
     # Predict
@@ -168,7 +151,7 @@ def run_api(predictor):
         vespidae_score = float(probabilities[3].iloc[0]) * 100
     except Exception as e:
         st.json({"error": f"Prediction failed: {e}"})
-        return
     # Determine highest-scoring label
     highest_score = max(honeybee_score, bumblebee_score, vespidae_score)
@@ -182,35 +165,28 @@ def run_api(predictor):
         else:
             prediction_label = "Vespidae (wasp/hornet)"
-    # Return results as JSON
     st.json({
         "honeybee_score": honeybee_score,
         "bumblebee_score": bumblebee_score,
         "vespidae_score": vespidae_score,
         "prediction_label": prediction_label
     })
-# -------------------------
-# UI HANDLER
-# -------------------------
 def run_ui(predictor):
     st.title("Honey Bee Image Classification")
-    # File uploader
     uploaded_file = st.file_uploader(
-        "Upload a photo of the suspected bee to see if you have honey bees. :bee:",
         type=["png", "jpg", "jpeg"]
     )
     with st.expander("ML Model Details"):
         st.write("""
-            We trained a MultiModalPredictor from the AutoGluon library to classify images of bees,
-            focusing primarily on Honey Bees. The model is fine-tuned on a curated dataset from inaturalist
-            images (70k+ images) with an accuracy of ~97.5%. It classifies the image as Honey Bee, Bumblebee,
-            or a Vespidae (wasp/hornet).
-            **Open Source**:
-            [Honey-Bee-Society/honeybee_ml_v1](https://huggingface.co/Honey-Bee-Society/honeybee_ml_v1)
         """)
     if uploaded_file is not None:
@@ -227,50 +203,38 @@ def run_ui(predictor):
                 bumblebee_score = float(probabilities[2].iloc[0]) * 100
                 vespidae_score = float(probabilities[3].iloc[0]) * 100
-                # Generate a safe and unique filename
                 timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
                 sanitized_filename = sanitize_filename(uploaded_file.name)
                 img_name = f"processed_{sanitized_filename}_{timestamp}.jpg"
-                # Save compressed image
                 image_path = save_image(image, img_name)
-                # Log predictions
                 log_predictions(image_path, honeybee_score, bumblebee_score, vespidae_score)
-                # Find highest score
                 highest_score = max(honeybee_score, bumblebee_score, vespidae_score)
-                # Display result
                 if highest_score < 80:
-                    st.warning("We are fairly confident there is no bee in this photo. Try another image.")
                 else:
                     if honeybee_score == highest_score:
                         st.success("Yes! This is a honey bee!")
                     elif bumblebee_score == highest_score:
-                        st.info("This is likely a bumblebee, not a honey bee.")
                     else:
-                        st.info("This is likely a member of the vespidae family (wasp, hornet, etc.).")
             except Exception as e:
                 st.error(f"An error occurred: {e}")
             finally:
                 progress_bar.empty()
-# -------------------------
-# MAIN ENTRY POINT
-# -------------------------
 def main():
     predictor = load_model()
-    # Check if we're in "API mode" or "UI mode"
-    query_params = st.query_params  # Replaced st.experimental_get_query_params with st.query_params
     if "api" in query_params:
-        # Run as an API (no UI)
         run_api(predictor)
     else:
-        # Run the standard UI
         run_ui(predictor)
 if __name__ == '__main__':

 log_filename = "model_predictions.log"
 logging.basicConfig(filename=log_filename, level=logging.INFO, format='%(asctime)s - %(message)s')
+# Set the page config
+st.set_page_config(page_title="Honey Bee Image Classification", layout="wide")
 @st.cache_resource
 def load_model():
     repo_id = "Honey-Bee-Society/honeybee_ml_v1"
     local_dir = snapshot_download(repo_id)
     assets_path = os.path.join(local_dir, "assets.json")
     model_checkpoint = os.path.join(local_dir, "model.ckpt")
     if not os.path.exists(assets_path) or not os.path.exists(model_checkpoint):
         raise FileNotFoundError("Required model files not found in the downloaded directory.")
     return MultiModalPredictor.load(local_dir)
 def resize_image_proportionally(image, max_size_mb=1):
     img_byte_array = io.BytesIO()
     image.save(img_byte_array, format='PNG')
     img_size = len(img_byte_array.getvalue()) / (1024 * 1024)
     return image
 def predict_image(image, predictor):
     img_byte_array = io.BytesIO()
     image.save(img_byte_array, format='PNG')
     img_data = img_byte_array.getvalue()
     return probabilities
 def save_image(image, img_name, target_size_kb=500):
     processed_image_path = os.path.join("processed_images", img_name)
     if not os.path.exists("processed_images"):
         os.makedirs("processed_images")
+    quality = 95
     img_byte_array = io.BytesIO()
+    while quality > 10:
         img_byte_array.seek(0)
         image.save(img_byte_array, format='JPEG', quality=quality)
         img_size_kb = len(img_byte_array.getvalue()) / 1024
         if img_size_kb <= target_size_kb:
             break
         quality -= 5
     with open(processed_image_path, "wb") as f:
     )
 def sanitize_filename(filename):
     safe_filename = re.sub(r'[^A-Za-z0-9_.-]', '_', filename)
     return safe_filename
 def check_file_size(uploaded_file, max_size_mb=10):
     uploaded_file.seek(0, os.SEEK_END)
     file_size = uploaded_file.tell() / (1024 * 1024)
     uploaded_file.seek(0)
         return False
     return True
 def run_api(predictor):
     """
+    'API mode' for this Streamlit app.
+    Expects a query param ?api=1&image_url=<PUBLIC_IMAGE_URL>
+    Example usage (from command line):
+        curl -X GET "https://your-username-your-app.hf.space/?api=1&image_url=https://raw.githubusercontent.com/yourimage.jpg"
+    The response is HTML with an embedded JSON, but you can often parse it directly in Python:
+        >>> import requests
+        >>> response = requests.get("https://your-username-your-app.hf.space/?api=1&image_url=...")
+        >>> print(response.text)       # prints the entire HTML with JSON
+        # or sometimes:
+        >>> data = response.json()     # may work depending on how the client interprets the response
+        >>> print(data)
     """
+    params = st.experimental_get_query_params()  # or st.query_params in Streamlit 1.19+
+    image_url = params.get("image_url", [None])[0]
     if not image_url:
+        st.json({"error": "No 'image_url' provided. Usage: ?api=1&image_url=<URL>"})
+        st.stop()
     # Download the image
     response = requests.get(
     if response.status_code != 200:
         st.json({"error": f"Failed to retrieve image from {image_url}. HTTP {response.status_code}"})
+        st.stop()
     image_bytes = response.content
+    # Check file size (limit 10MB)
     image_size_mb = len(image_bytes)/(1024*1024)
     if image_size_mb > 10:
         st.json({"error": f"Image size {image_size_mb:.2f}MB exceeds 10MB limit."})
+        st.stop()
+    # Convert to PIL
     try:
         image = Image.open(io.BytesIO(image_bytes))
     except Exception as e:
         st.json({"error": f"Could not open image: {e}"})
+        st.stop()
+    # Resize
     image = resize_image_proportionally(image)
     # Predict
         vespidae_score = float(probabilities[3].iloc[0]) * 100
     except Exception as e:
         st.json({"error": f"Prediction failed: {e}"})
+        st.stop()
     # Determine highest-scoring label
     highest_score = max(honeybee_score, bumblebee_score, vespidae_score)
         else:
             prediction_label = "Vespidae (wasp/hornet)"
+    # Return results as JSON and stop further Streamlit processing
     st.json({
         "honeybee_score": honeybee_score,
         "bumblebee_score": bumblebee_score,
         "vespidae_score": vespidae_score,
         "prediction_label": prediction_label
     })
+    st.stop()
 def run_ui(predictor):
     st.title("Honey Bee Image Classification")
     uploaded_file = st.file_uploader(
+        "Upload a photo of the suspected bee...",
         type=["png", "jpg", "jpeg"]
     )
     with st.expander("ML Model Details"):
         st.write("""
+            We trained a MultiModalPredictor to classify bee images
+            (Honey Bee, Bumblebee, or Vespidae).
+            Accuracy is ~97.5% on our test set.
         """)
     if uploaded_file is not None:
                 bumblebee_score = float(probabilities[2].iloc[0]) * 100
                 vespidae_score = float(probabilities[3].iloc[0]) * 100
                 timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
                 sanitized_filename = sanitize_filename(uploaded_file.name)
                 img_name = f"processed_{sanitized_filename}_{timestamp}.jpg"
                 image_path = save_image(image, img_name)
                 log_predictions(image_path, honeybee_score, bumblebee_score, vespidae_score)
                 highest_score = max(honeybee_score, bumblebee_score, vespidae_score)
                 if highest_score < 80:
+                    st.warning("We are fairly confident there is no bee in this photo.")
                 else:
                     if honeybee_score == highest_score:
                         st.success("Yes! This is a honey bee!")
                     elif bumblebee_score == highest_score:
+                        st.info("Likely a bumblebee, not a honey bee.")
                     else:
+                        st.info("Likely a wasp/hornet (vespidae).")
             except Exception as e:
                 st.error(f"An error occurred: {e}")
             finally:
                 progress_bar.empty()
 def main():
     predictor = load_model()
+    # Decide whether we are in 'API mode' or normal UI mode
+    query_params = st.experimental_get_query_params()
     if "api" in query_params:
         run_api(predictor)
     else:
         run_ui(predictor)
 if __name__ == '__main__':