Spaces:

AMfeta99
/

Object_Evolution_Generator

Runtime error

App Files Files Community

AMfeta99 committed on May 21, 2025

Commit

062d16c

verified ·

1 Parent(s): 9036d72

Update app.py

Browse files

Files changed (1) hide show

app.py +96 -50

app.py CHANGED Viewed

@@ -1,23 +1,28 @@
-from transformers import HfAgent
 from PIL import Image, ImageDraw, ImageFont
 import gradio as gr
-import os
-#%% Utility Functions
 def add_label_to_image(image, label):
     draw = ImageDraw.Draw(image)
-    font_path = "/usr/share/fonts/truetype/dejavu/DejaVuSans-Bold.ttf"
-    font_size = 30
     try:
         font = ImageFont.truetype(font_path, font_size)
     except:
         font = ImageFont.load_default()
     text_bbox = draw.textbbox((0, 0), label, font=font)
     text_width, text_height = text_bbox[2] - text_bbox[0], text_bbox[3] - text_bbox[1]
-    position = (image.width - text_width - 20, image.height - text_height - 20)
     rect_margin = 10
     rect_position = [
         position[0] - rect_margin,
@@ -25,77 +30,108 @@ def add_label_to_image(image, label):
         position[0] + text_width + rect_margin,
         position[1] + text_height + rect_margin,
     ]
-    draw.rectangle(rect_position, fill=(0, 0, 0, 128))
     draw.text(position, label, fill="white", font=font)
     return image
-def plot_and_save_agent_image(image, label, save_path=None):
-    labeled_image = add_label_to_image(image, label)
     labeled_image.show()
     if save_path:
         labeled_image.save(save_path)
         print(f"Image saved to {save_path}")
 def generate_prompts_for_object(object_name):
-    return {
         "past": f"Show an old version of a {object_name} from its early days.",
         "present": f"Show a {object_name} with current features/design/technology.",
-        "future": f"Show a futuristic version of a {object_name}, predicting advanced features and design."
     }
-#%% HF Agent Initialization
-agent = HfAgent("https://api-inference.huggingface.co/models/HuggingFaceH4/zephyr-7b-beta")
-#%% Core Generation Function
 def generate_object_history(object_name):
     images = []
-    gif_frames = []
     prompts = generate_prompts_for_object(object_name)
     labels = {
         "past": f"{object_name} - Past",
         "present": f"{object_name} - Present",
         "future": f"{object_name} - Future"
     }
-    output_image_paths = []
-    for period, prompt in prompts.items():
-        print(f"Generating image for: {prompt}")
-        result = agent.run(prompt)
-        # Find first image in result (agent returns a dict)
-        image_path = next((v for v in result.values() if isinstance(v, str) and v.endswith((".png", ".jpg"))), None)
-        if not image_path or not os.path.exists(image_path):
-            raise RuntimeError(f"No valid image generated for {prompt}")
-        image = Image.open(image_path).convert("RGB")
-        labeled_image = add_label_to_image(image, labels[period])
-        filename = f"{object_name}_{period}.png"
-        labeled_image.save(filename)
-        output_image_paths.append((filename, labels[period]))
-        gif_frames.append(labeled_image)
-    # Save animated GIF
-    gif_path = f"{object_name}_evolution.gif"
-    gif_frames[0].save(gif_path, save_all=True, append_images=gif_frames[1:], duration=1000, loop=0)
-    return output_image_paths, gif_path
-#%% Gradio Interface
 def create_gradio_interface():
     with gr.Blocks() as demo:
-        gr.Markdown("# TimeMetamorphy: An Object Evolution Generator")
         gr.Markdown("""
-        Explore how objects change over time — from past, to present, to future.
-        Enter any object below and let AI visualize its transformation through the ages.
         """)
         default_images = [
             ("car_past.png", "Car - Past"),
             ("car_present.png", "Car - Present"),
@@ -105,15 +141,25 @@ def create_gradio_interface():
         with gr.Row():
             with gr.Column():
-                object_name_input = gr.Textbox(label="Enter an object name", placeholder="e.g., bicycle, phone")
                 generate_button = gr.Button("Generate Evolution")
                 image_gallery = gr.Gallery(label="Generated Images", show_label=True, columns=3, rows=1, value=default_images)
-                gif_output = gr.Image(label="Generated GIF", show_label=True, value=default_gif_path)
         generate_button.click(fn=generate_object_history, inputs=[object_name_input], outputs=[image_gallery, gif_output])
     return demo
-# Launch
 demo = create_gradio_interface()
-demo.launch(share=True)

+from transformers import load_tool, ReactCodeAgent, HfApiEngine
 from PIL import Image, ImageDraw, ImageFont
+import tempfile
 import gradio as gr
+#%% Methods
+# Function to add a label to an image
 def add_label_to_image(image, label):
+    # Create a drawing context
     draw = ImageDraw.Draw(image)
+    # Define font path and size (adjust font path for your environment)
+    font_path = "/usr/share/fonts/truetype/dejavu/DejaVuSans-Bold.ttf"  # Example font path
+    font_size = 30  # Larger font size for better visibility
     try:
         font = ImageFont.truetype(font_path, font_size)
     except:
         font = ImageFont.load_default()
+    # Calculate the size of the text and its position (anchored to the bottom-right corner)
     text_bbox = draw.textbbox((0, 0), label, font=font)
     text_width, text_height = text_bbox[2] - text_bbox[0], text_bbox[3] - text_bbox[1]
+    position = (image.width - text_width - 20, image.height - text_height - 20)# right-aligned with margin
+    # Add a semi-transparent rectangle behind the text for better visibility
     rect_margin = 10
     rect_position = [
         position[0] - rect_margin,
         position[0] + text_width + rect_margin,
         position[1] + text_height + rect_margin,
     ]
+    draw.rectangle(rect_position, fill=(0, 0, 0, 128))  # Semi-transparent black
     draw.text(position, label, fill="white", font=font)
     return image
+# Function to plot, label, and save an image
+def plot_and_save_agent_image(agent_image, label, save_path=None):
+    # Convert AgentImage to a raw PIL Image
+    pil_image = agent_image.to_raw()
+    # Add a label to the image
+    labeled_image = add_label_to_image(pil_image, label)
+    # Plot the image using PIL's show method
     labeled_image.show()
+    # If save_path is provided, save the image
     if save_path:
         labeled_image.save(save_path)
         print(f"Image saved to {save_path}")
+    else:
+        print("No save path provided. Image not saved.")
+# Function to generate prompts for an object
 def generate_prompts_for_object(object_name):
+    prompts = {
         "past": f"Show an old version of a {object_name} from its early days.",
         "present": f"Show a {object_name} with current features/design/technology.",
+        "future": f"Show a futuristic version of a {object_name}, by predicting advanced features and futuristic design."
     }
+    return prompts
+# Function to generate the object's history images and GIF
 def generate_object_history(object_name):
     images = []
+    # Get prompts for the object
     prompts = generate_prompts_for_object(object_name)
     labels = {
         "past": f"{object_name} - Past",
         "present": f"{object_name} - Present",
         "future": f"{object_name} - Future"
     }
+    # Generate sequential images and display them
+    for time_period, frame in prompts.items():
+        print(f"Generating {time_period} frame: {frame}")
+        result = agent.run(frame)  # The tool generates the image
+        # Append the image to the list for GIF creation
+        images.append(result.to_raw())  # Ensure we're using raw image for GIF
+        # Save each image with the appropriate name and label
+        image_filename = f"{object_name}_{time_period}.png"
+        plot_and_save_agent_image(result, labels[time_period], save_path=image_filename)
+    # Create GIF from images
+    gif_path = f"{object_name}_evolution.gif"
+    images[0].save(
+        gif_path,
+        save_all=True,
+        append_images=images[1:],
+        duration=1000,  # Duration in milliseconds for each frame
+        loop=0          # Infinite loop
+    )
+    # Return images and GIF path
+    return images, gif_path
+#%% Initialization of tools and AI_Agent
+# Import text-to-image tool from Hub
+image_generation_tool = load_tool("m-ric/text-to-image", cache=False)
+# Import the DuckDuckGo search tool from transformers.agents
+from transformers.agents.search import DuckDuckGoSearchTool
+search_tool = DuckDuckGoSearchTool()
+# Load the LLM engine
+llm_engine = HfApiEngine("Qwen/Qwen2.5-72B-Instruct")
+# Initialize the agent with both tools
+agent = ReactCodeAgent(tools=[image_generation_tool, search_tool], llm_engine=llm_engine)
+# Gradio interface
 def create_gradio_interface():
     with gr.Blocks() as demo:
+        gr.Markdown("# TimeMetamorphy: an object Evolution Generator")
+        # Add a section for instructions
         gr.Markdown("""
+        ## Unlocking the secrets of time!
+        This app unveils these mysteries by offering a unique/magic lens that allows us "time travel".
+        Powered by AI agents equipped with cutting-edge tools, it provides the superpower to explore the past, witness the present, and dream up the future like never before.
+        This system allows you to generate visualizations of how an object/concept, like a bicycle or a car, may have evolved over time.
+        It generates images of the object in the past, present, and future based on your input.
+        ### Default Example: Evolution of a Car
+        Below, you can see a precomputed example of a "car" evolution. Enter another object to generate its evolution.
         """)
+        # Paths to the precomputed files
         default_images = [
             ("car_past.png", "Car - Past"),
             ("car_present.png", "Car - Present"),
         with gr.Row():
             with gr.Column():
+                # Textbox for user to input an object name
+                object_name_input = gr.Textbox(label="Enter an object name (e.g., bicycle, phone)",
+                                              placeholder="Enter an object name",
+                                              lines=1)
+                # Button to trigger the generation of images and GIF
                 generate_button = gr.Button("Generate Evolution")
+                # Gradio Gallery component to display the images
                 image_gallery = gr.Gallery(label="Generated Images", show_label=True, columns=3, rows=1, value=default_images)
+                # Output for the generated GIF
+                gif_output = gr.Image(label="Generated GIF", show_label=True, value=default_gif_path)
+        # Set the action when the button is clicked
         generate_button.click(fn=generate_object_history, inputs=[object_name_input], outputs=[image_gallery, gif_output])
     return demo
+# Launch the Gradio app
 demo = create_gradio_interface()
+demo.launch(share=True)