GroundTruth-AI-dev

Sleeping

App Files Files Community

grixelle committed 28 days ago

Commit

92d5279

verified ·

1 Parent(s): 6dffb88

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -20

app.py CHANGED Viewed

@@ -13,30 +13,35 @@ def ground_truth_engine(past_img, present_img, audit_level, progress=gr.Progress
     if past_img is None or present_img is None:
         return "Please upload both images."
-    # Map Slider to API 'thinking_budget'
-    # Quick = Low budget, Forensic = High budget
-    budget_map = {"Quick Scan": 100, "Standard Audit": 400, "Deep Forensic": 1000}
-    selected_budget = budget_map.get(audit_level, 400)
-    progress(0.2, desc=f"Level: {audit_level} (Budget: {selected_budget})")
     prompt = f"""
-    Perform a {audit_level} structural audit.
-    Compare roofing, landscaping, and exterior condition.
-    Provide precise physical evidence for changes.
-    Conclude with 'Maintenance Trajectory': IMPROVING, STABLE, or DECLINING.
     """
     try:
-        progress(0.5, desc="Robotics-ER is reasoning spatially...")
-        # We pass the audit level intent into the generation config
         response = client.models.generate_content(
             model="gemini-robotics-er-1.5-preview",
-            contents=[prompt, past_img, present_img],
-            config={
-                "thinking_budget": selected_budget
-            }
         )
         progress(1.0, desc="Audit Complete!")
@@ -51,18 +56,15 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
         with gr.Column():
             p_img = gr.Image(label="Past Condition", type="pil")
             c_img = gr.Image(label="Current Condition", type="pil")
-            # New UI Element: Audit Level Slider
             audit_slider = gr.Radio(
                 choices=["Quick Scan", "Standard Audit", "Deep Forensic"],
                 value="Standard Audit",
-                label="Audit Depth (Robotics Reasoning Level)"
             )
             submit = gr.Button("Analyze Structural Trajectory", variant="primary")
         with gr.Column():
-            output = gr.Markdown(label="Audit Report")
     submit.click(
         fn=ground_truth_engine,

     if past_img is None or present_img is None:
         return "Please upload both images."
+    # Directives updated to request normalized coordinates (0-1000)
+    audit_directives = {
+        "Quick Scan": "Perform a rapid structural overview.",
+        "Standard Audit": "Compare roofing, landscaping, and exterior siding.",
+        "Deep Forensic": """Perform an exhaustive spatial audit.
+        For the 3 most significant structural changes, identify their center points
+        using normalized [y, x] coordinates (0-1000).
+        Identify subtle shingle wear, foundation cracks, and biological encroachment."""
+    }
+    selected_directive = audit_directives.get(audit_level, audit_directives["Standard Audit"])
+    progress(0.2, desc=f"Mode: {audit_level}")
     prompt = f"""
+    SYSTEM INSTRUCTION: You are a forensic structural appraiser using spatial grounding.
+    DIRECTIVE: {selected_directive}
+    TASK: Compare these images.
+    1. List the structural findings.
+    2. Provide the [y, x] coordinates for points of interest if in Deep Forensic mode.
+    3. Conclude with 'Maintenance Trajectory': IMPROVING, STABLE, or DECLINING.
     """
     try:
+        progress(0.5, desc="Robotics-ER is calculating spatial points...")
         response = client.models.generate_content(
             model="gemini-robotics-er-1.5-preview",
+            contents=[prompt, past_img, present_img]
         )
         progress(1.0, desc="Audit Complete!")
         with gr.Column():
             p_img = gr.Image(label="Past Condition", type="pil")
             c_img = gr.Image(label="Current Condition", type="pil")
             audit_slider = gr.Radio(
                 choices=["Quick Scan", "Standard Audit", "Deep Forensic"],
                 value="Standard Audit",
+                label="Audit Depth"
             )
             submit = gr.Button("Analyze Structural Trajectory", variant="primary")
         with gr.Column():
+            output = gr.Markdown(label="Forensic Audit Report")
     submit.click(
         fn=ground_truth_engine,