Spaces:

NHMUK
/

MATCHA

Sleeping

App Files Files Community

Chris Addis committed on Apr 28, 2025

Commit

2c8a1cc

1 Parent(s): 12bfe0c

Advanced settings

Browse files

Files changed (1) hide show

app.py +106 -25

app.py CHANGED Viewed

@@ -36,6 +36,20 @@ PREFERENCES_FILE = "data/user_preferences.csv"
 # Ensure directory exists
 os.makedirs(os.path.dirname(PREFERENCES_FILE), exist_ok=True)
 def get_sys_prompt(length="medium", photograph=False):
     extra_prompt = ""
@@ -107,7 +121,21 @@ def create_demo():
     """
     # --- Pass css to gr.Blocks ---
     with gr.Blocks(theme=gr.themes.Monochrome(), css=custom_css) as demo:
-        # [existing header rows remain the same]
         with gr.Row():
             # Left column: Controls and uploads
@@ -118,8 +146,8 @@ def create_demo():
                     file_count="multiple"
                 )
-                # Main model choices - limited selection
-                main_model_choices = [
                     ("Gemini 2.0 Flash (default)", "google/gemini-2.0-flash-001"),
                     ("GPT-4.1 Mini", "gpt-4.1-mini"),
                     ("GPT-4.1", "gpt-4.1"),
@@ -128,30 +156,36 @@ def create_demo():
                     ("Gemini 2.5 Flash Thinking", "google/gemini-2.5-flash-preview:thinking")
                 ]
                 default_model_internal_value = "google/gemini-2.0-flash-001"
                 model_choice = gr.Dropdown(
-                    choices=main_model_choices, label="Select Model",
-                    value=default_model_internal_value, visible=True
                 )
                 length_choice = gr.Radio(
-                    choices=["short", "medium", "long"], label="Response Length",
-                    value="medium", info="Short: max 130 chars | Medium: 250-300 chars | Long: max 450 chars"
                 )
                 # Advanced settings accordion
                 with gr.Accordion("Advanced Settings", open=False):
-                    # Additional model choices for advanced users
-                    advanced_model_choices = [
-                        ("GPT-4.1 Nano", "gpt-4.1-nano"),
-                        ("ChatGPT Latest", "openai/chatgpt-4o-latest"),
-                        ("Llama 4 Maverick", "meta-llama/llama-4-maverick")
-                    ]
-                    advanced_model_choice = gr.Dropdown(
-                        choices=advanced_model_choices,
-                        label="Additional Models",
-                        value=None
                     )
                     content_type = gr.Radio(
@@ -159,8 +193,15 @@ def create_demo():
                         label="Content Type",
                         value="Museum Object"
                     )
-                # [rest of the interface remains the same]
                 gr.Markdown("### Uploaded Images")
                 input_gallery = gr.Gallery(
                     label="Uploaded Image Previews", columns=3, height=150,
@@ -198,7 +239,50 @@ def create_demo():
                 all_images = gr.State([])
                 all_results = gr.State([])
-        # --- Functions (handle_upload, analyze_images, navigators) remain the same ---
         # Handle file uploads
         def handle_upload(files, current_paths, current_filenames):
             file_paths = []
@@ -217,13 +301,10 @@ def create_demo():
         )
         # Analyze images
-        def analyze_images(image_paths, main_model, adv_model, length_choice, filenames, content_type_choice):
             if not image_paths:
                 return [], [], 0, None, "0 of 0", "No images uploaded to analyze.", None
-            # Determine which model to use (advanced model takes precedence if selected)
-            model_choice = adv_model if adv_model else main_model
             is_photography = content_type_choice == "Photography"
             sys_prompt = get_sys_prompt(length_choice, photograph=is_photography)
             image_results = []
@@ -278,7 +359,7 @@ def create_demo():
         # Connect analyze button
         analyze_button.click(
             fn=analyze_images,
-            inputs=[image_state, model_choice, advanced_model_choice, length_choice, filename_state, content_type],
             outputs=[all_images, all_results, current_index, current_image, image_counter,
                      analysis_text, csv_download]
         )

 # Ensure directory exists
 os.makedirs(os.path.dirname(PREFERENCES_FILE), exist_ok=True)
+# Per-model display info keyed by internal model ID: approximate cost per 100 image API calls and a relative speed label.
+# NOTE: these are placeholder values - replace with actual pricing before relying on them.
+MODEL_PRICING = {
+    "google/gemini-2.0-flash-001": {"cost": "$0.50", "speed": "Fast"},
+    "gpt-4.1-mini": {"cost": "$2.00", "speed": "Medium"},
+    "gpt-4.1": {"cost": "$5.00", "speed": "Medium-Slow"},
+    "anthropic/claude-3.7-sonnet": {"cost": "$4.00", "speed": "Medium"},
+    "google/gemini-2.5-pro-preview-03-25": {"cost": "$1.50", "speed": "Medium"},
+    "google/gemini-2.5-flash-preview:thinking": {"cost": "$0.75", "speed": "Fast"},
+    "gpt-4.1-nano": {"cost": "$1.00", "speed": "Fast"},
+    "openai/chatgpt-4o-latest": {"cost": "$4.50", "speed": "Medium-Slow"},
+    "meta-llama/llama-4-maverick": {"cost": "$0.25", "speed": "Medium"}
+}
 def get_sys_prompt(length="medium", photograph=False):
     extra_prompt = ""
     """
     # --- Pass css to gr.Blocks ---
     with gr.Blocks(theme=gr.themes.Monochrome(), css=custom_css) as demo:
+        with gr.Row():
+            with gr.Column(scale=3):
+                gr.Markdown("# MATCHA: Museum Alt-Text for Cultural Heritage with AI 🍵 🌿")
+                gr.Markdown("Upload one or more images to generate accessible alternative text (designed to meet WCAG Guidelines)")
+                gr.Markdown("Developed by the Natural History Museum in Partnership with National Museums Liverpool. Funded by the DCMS Pilot Scheme")
+            with gr.Column(scale=1):
+                with gr.Row():
+                    gr.Image("images/nhm_logo.png", show_label=False, height=120,
+                             interactive=False, show_download_button=False,
+                             show_share_button=False, show_fullscreen_button=False,
+                             container=False, elem_id="nhm-logo")
+                    gr.Image("images/nml_logo.png", show_label=False, height=120,
+                             interactive=False, show_download_button=False,
+                             show_share_button=False, show_fullscreen_button=False,
+                             container=False, elem_id="nml-logo")
         with gr.Row():
             # Left column: Controls and uploads
                     file_count="multiple"
                 )
+                # Define preferred and additional models
+                preferred_models = [
                     ("Gemini 2.0 Flash (default)", "google/gemini-2.0-flash-001"),
                     ("GPT-4.1 Mini", "gpt-4.1-mini"),
                     ("GPT-4.1", "gpt-4.1"),
                     ("Gemini 2.5 Flash Thinking", "google/gemini-2.5-flash-preview:thinking")
                 ]
+                additional_models = [
+                    ("GPT-4.1 Nano", "gpt-4.1-nano"),
+                    ("ChatGPT Latest", "openai/chatgpt-4o-latest"),
+                    ("Llama 4 Maverick", "meta-llama/llama-4-maverick")
+                ]
+                # Default model
                 default_model_internal_value = "google/gemini-2.0-flash-001"
+                # Model dropdown (will be updated dynamically)
                 model_choice = gr.Dropdown(
+                    choices=preferred_models,
+                    label="Select Model",
+                    value=default_model_internal_value,
+                    visible=True
                 )
                 length_choice = gr.Radio(
+                    choices=["short", "medium", "long"],
+                    label="Response Length",
+                    value="medium",
+                    info="Short: max 130 chars | Medium: 250-300 chars | Long: max 450 chars"
                 )
                 # Advanced settings accordion
                 with gr.Accordion("Advanced Settings", open=False):
+                    show_all_models = gr.Checkbox(
+                        label="Show Additional Models",
+                        value=False,
+                        info="Display additional model options in the dropdown above"
                     )
                     content_type = gr.Radio(
                         label="Content Type",
                         value="Museum Object"
                     )
+                    # Display current model info
+                    model_info = gr.Markdown(
+                        """**Current Model**: Gemini 2.0 Flash
+                        **Cost per 100 Images**: $0.50
+                        **Speed**: Fast""",
+                        label="Model Information"
+                    )
                 gr.Markdown("### Uploaded Images")
                 input_gallery = gr.Gallery(
                     label="Uploaded Image Previews", columns=3, height=150,
                 all_images = gr.State([])
                 all_results = gr.State([])
+        # --- Functions for model selection and display ---
+        # Update dropdown based on checkbox
+        def update_model_dropdown(show_all, current_model):
+            if show_all:
+                # Combine preferred and additional models
+                all_models = preferred_models + additional_models
+                return gr.Dropdown.update(choices=all_models, value=current_model)
+            else:
+                # Only show preferred models
+                # If current model is not in preferred, switch to default
+                current_model_in_preferred = any(model[1] == current_model for model in preferred_models)
+                if not current_model_in_preferred:
+                    return gr.Dropdown.update(choices=preferred_models, value=default_model_internal_value)
+                return gr.Dropdown.update(choices=preferred_models, value=current_model)
+        # Update model info display
+        def update_model_info(model_id):
+            # Find the display name for the model ID
+            model_name = next((name for name, id in preferred_models + additional_models if id == model_id), "Unknown Model")
+            # Get pricing info
+            pricing_info = MODEL_PRICING.get(model_id, {"cost": "Unknown", "speed": "Unknown"})
+            # Create markdown text
+            info_text = f"""**Current Model**: {model_name}
+            **Cost per 100 Images**: {pricing_info['cost']}
+            **Speed**: {pricing_info['speed']}"""
+            return info_text
+        # Connect checkbox to update dropdown
+        show_all_models.change(
+            fn=update_model_dropdown,
+            inputs=[show_all_models, model_choice],
+            outputs=[model_choice]
+        )
+        # Connect model dropdown to update info display
+        model_choice.change(
+            fn=update_model_info,
+            inputs=[model_choice],
+            outputs=[model_info]
+        )
         # Handle file uploads
         def handle_upload(files, current_paths, current_filenames):
             file_paths = []
         )
         # Analyze images
+        def analyze_images(image_paths, model_choice, length_choice, filenames, content_type_choice):
             if not image_paths:
                 return [], [], 0, None, "0 of 0", "No images uploaded to analyze.", None
             is_photography = content_type_choice == "Photography"
             sys_prompt = get_sys_prompt(length_choice, photograph=is_photography)
             image_results = []
         # Connect analyze button
         analyze_button.click(
             fn=analyze_images,
+            inputs=[image_state, model_choice, length_choice, filename_state, content_type],
             outputs=[all_images, all_results, current_index, current_image, image_counter,
                      analysis_text, csv_download]
         )