Spaces:

DvorakInnovationAI
/

GenAI-FASTAPI

Sleeping

App Files Files Community

subashpoudel committed on Jun 29, 2025

Commit

fa8520f

1 Parent(s): 3c1150c

Next commit

Browse files

Files changed (12) hide show

__pycache__/main.cpython-312.pyc +0 -0
brainstroming_agent/utils/__pycache__/nodes.cpython-312.pyc +0 -0
brainstroming_agent/utils/__pycache__/prompts.cpython-312.pyc +0 -0
brainstroming_agent/utils/nodes.py +1 -1
brainstroming_agent/utils/prompts.py +1 -1
context_analysis_agent/utils/__pycache__/prompts.cpython-312.pyc +0 -0
context_analysis_agent/utils/prompts.py +1 -0
main.py +11 -25
orchestration_agent/agent.py +10 -4
orchestration_agent/utils/prompts.py +29 -13
orchestration_agent/utils/state.py +1 -0
orchestration_agent/utils/utils.py +38 -0

__pycache__/main.cpython-312.pyc CHANGED Viewed

Binary files a/__pycache__/main.cpython-312.pyc and b/__pycache__/main.cpython-312.pyc differ

brainstroming_agent/utils/__pycache__/nodes.cpython-312.pyc CHANGED Viewed

Binary files a/brainstroming_agent/utils/__pycache__/nodes.cpython-312.pyc and b/brainstroming_agent/utils/__pycache__/nodes.cpython-312.pyc differ

brainstroming_agent/utils/__pycache__/prompts.cpython-312.pyc CHANGED Viewed

Binary files a/brainstroming_agent/utils/__pycache__/prompts.cpython-312.pyc and b/brainstroming_agent/utils/__pycache__/prompts.cpython-312.pyc differ

brainstroming_agent/utils/nodes.py CHANGED Viewed

@@ -26,7 +26,7 @@ def caption_image(state: State) -> State:
                   {
                       "role": "user",
                       "content": [
-                          {"type": "text", "text": image_captioning_prompt(state.idea,state.business_details)},
                           {
                               "type": "image_url",
                               "image_url": {

                   {
                       "role": "user",
                       "content": [
+                          {"type": "text", "text": image_captioning_prompt(state)},
                           {
                               "type": "image_url",
                               "image_url": {

brainstroming_agent/utils/prompts.py CHANGED Viewed

@@ -34,7 +34,7 @@ Only use the visual cues from the image to inspire your caption, but ensure it f
 Here are the provided **business details** and **video idea** for you. Strongly focus on these two contexts too.
 1. Business details: {state.business_details}
-2. Video idea: {state.video_idea}
 Now generate:
 - A rich 100-word image caption, and

 Here are the provided **business details** and **video idea** for you. Strongly focus on these two contexts too.
 1. Business details: {state.business_details}
+2. Video idea: {state.idea}
 Now generate:
 - A rich 100-word image caption, and

context_analysis_agent/utils/__pycache__/prompts.cpython-312.pyc CHANGED Viewed

Binary files a/context_analysis_agent/utils/__pycache__/prompts.cpython-312.pyc and b/context_analysis_agent/utils/__pycache__/prompts.cpython-312.pyc differ

context_analysis_agent/utils/prompts.py CHANGED Viewed

@@ -1,6 +1,7 @@
 introduction_prompt = '''
 You are a business assistant who collects only valid and relevant data.
 Your job is to gather details from business owners in a friendly and conversational manner to understand their business better. Ask in very easy and short way.
 We need these details:
 1. Business Type (e.g., e-commerce, SaaS, consulting),

 introduction_prompt = '''
 You are a business assistant who collects only valid and relevant data.
 Your job is to gather details from business owners in a friendly and conversational manner to understand their business better. Ask in very easy and short way.
+No matter what the user asks, you have to say to user that we have to collect these details first and only you can move forward.
 We need these details:
 1. Business Type (e.g., e-commerce, SaaS, consulting),

main.py CHANGED Viewed

@@ -9,6 +9,7 @@ from business_interaction_agent.agent import BusinessInteractionChatbot
 from context_analysis_agent.utils.utils import save_to_db
 import ast
 from orchestration_agent.agent import orchestration_chat
 from brainstroming_agent.utils.utils import encode_image_to_base64 , generate_final_story, generate_image
 from idea_to_budget_agent.agent import budget_calculator
 from ideation_agent.agent import ideation_graph
@@ -25,39 +26,24 @@ business_interaction_graph = BusinessInteractionChatbot()
 idea_graph = ideation_graph()
 brainstrom_graph = brainstroming_graph()
 human_refine_graph = human_refined_idea()
-# stored_data={}
-# # stored_data['business_details']={"business_type": "fitness and gym", "platform": "instagram, tiktok", "target_audience": "every software needed clients", "business_goals": "to expand in every cities of nepal", "offerings": "nepali cloths and products", "Challenges_faced": "finding new customers, attracting large customers"}
-# stored_data['business_details'] = {
-#     "business_type": "fitness and gym",
-#     "platform": "Instagram, TikTok",
-#     "target_audience": "young Nepali adults (ages 18–40) who are health-conscious and active on social media",
-#     "business_goals": "to expand gym branches across all major cities of Nepal and build a strong fitness community",
-#     "offerings": "personal training, group fitness classes, modern workout equipment, nutrition guidance, and wellness programs",
-#     "Challenges_faced": "attracting loyal members, standing out in a competitive market, and promoting consistent engagement"
-# }
-# stored_data['final_ideation']= ['''A street magician performs tricks, leaving a crowd awestruck. One trick falters, inspiring him to hit the gym. Months later, he fuses fitness with magic, showcasing strength through performance, proving that transformation can captivate and inspire a community''',
-#                                                   '''A group of strangers attends a quirky food festival, each trying bizarre dishes. One adventurer finds a fitness coach among them. They bond over health, sparking a weekly workout group that brings the community together, blending fun and fitness effortlessly.''',
-#                                                     '''A lost hiker discovers a hidden waterfall, but slips on the rocks, nearly falling. A passing fitness enthusiast helps him up, encouraging regular exercise for safety and strength. Together, they start a hiking club, uniting fitness and nature lovers in their city''',
-#                                                     '''A young Nepali woman discovers a hidden strength within herself while hiking the Himalayas. She returns home, and her fitness journey begins at our gym. With the help of our personal trainers, she transforms her body and mind. The gym becomes her sanctuary, and her transformation inspires others to find their inner strength.''']
-# stored_data['human_ideation_interactions'] = []
-# stored_data['refined_ideation'] = '''A street magician's trick fails, inspiring a fitness journey. Months later, he fuses magic with strength, showcasing transformation. Meanwhile, a fitness coach bonds with foodies over health, sparking a community workout group, blending fun and fitness.'''
-class UserMessage(BaseModel):
     message: str
 @app.post("/orchestration")
-def orchestration_endpoint(msg:UserMessage):
-    response = orchestration_chat(msg.message)
-    return {'tool_response': response.tool, 'message_response':response.message}
 @app.post("/context-analysis")
 def context_analysis(msg: UserMessage):
     response = context_analysis_graph.chat(msg.message)

 from context_analysis_agent.utils.utils import save_to_db
 import ast
 from orchestration_agent.agent import orchestration_chat
+from orchestration_agent.utils.utils import caption_image
 from brainstroming_agent.utils.utils import encode_image_to_base64 , generate_final_story, generate_image
 from idea_to_budget_agent.agent import budget_calculator
 from ideation_agent.agent import ideation_graph
 idea_graph = ideation_graph()
 brainstrom_graph = brainstroming_graph()
 human_refine_graph = human_refined_idea()
+# orchestrate_graph = orchestration_chat()
+class OrchestrationRequest(BaseModel):
     message: str
+    image_base64 : Optional[list] = []
 @app.post("/orchestration")
+def orchestration_endpoint(request:OrchestrationRequest):
+    print('Image:',request.image_base64)
+    result = orchestration_chat(request.message , request.image_base64)
+    stored_data['image_caption']= result.image_caption
+    return {'tool_response': result.tool , 'message_response': result.message, 'image_caption':result.image_caption}
+class UserMessage(BaseModel):
+    message: str
 @app.post("/context-analysis")
 def context_analysis(msg: UserMessage):
     response = context_analysis_graph.chat(msg.message)

orchestration_agent/agent.py CHANGED Viewed

@@ -3,21 +3,27 @@ from langgraph.checkpoint.memory import MemorySaver
 from .utils.nodes import orchestration_node
 from utils.models_loader import llm
 from .utils.state import ValidationFormatter
 import re
 memory = MemorySaver()
-def initialize_workflow():
     workflow = StateGraph(MessagesState)
     workflow.add_node("chatbot", orchestration_node)
     workflow.add_edge(START, "chatbot")
     workflow.add_edge("chatbot", END)
     return workflow.compile(checkpointer=memory)
-def orchestration_chat(user_input: str):
-    agent = initialize_workflow()
     config = {"configurable": {"thread_id": "orchestration-thread"}}
-    response = agent.invoke({"messages": [user_input]}, config)['messages'][-1].content
     response=llm.with_structured_output(ValidationFormatter).invoke(response)
     return response

 from .utils.nodes import orchestration_node
 from utils.models_loader import llm
 from .utils.state import ValidationFormatter
+from .utils.utils import caption_image
 import re
 memory = MemorySaver()
+def orchestration_graph():
     workflow = StateGraph(MessagesState)
     workflow.add_node("chatbot", orchestration_node)
     workflow.add_edge(START, "chatbot")
     workflow.add_edge("chatbot", END)
     return workflow.compile(checkpointer=memory)
+def orchestration_chat(user_input: str, image_base64=[]):
+    if len(image_base64)>0:
+        caption_response = caption_image(image_base64, user_input)
+    else:
+        caption_response =''
+    agent = orchestration_graph()
     config = {"configurable": {"thread_id": "orchestration-thread"}}
+    response = agent.invoke({"messages": [f'''The user's message is:\n {user_input}\nThe information of image is:\n{caption_response}\n''']}, config)['messages'][-1].content
     response=llm.with_structured_output(ValidationFormatter).invoke(response)
     return response

orchestration_agent/utils/prompts.py CHANGED Viewed

@@ -1,29 +1,45 @@
 orchestration_prompt = """
-You are an AI orchestration agent that reads the user's message and decides which one of the following tools should be called next. You're perfect at analyzing the intention of the user.
-Your job is to analyze the user's input and return a JSON object with:
 1. `tool`: the most appropriate tool name from the list below (or `null` if not applicable)
-2. `message`: a clear, helpful message to show to the user. This can be a question, guidance or even an action confirmation depending on the tool.
 ---
 ### Available Tools:
 1. **ideation** → Use if the user wants to create marketing video ideas.
 2. **human-idea-refining** → Use if the user gives feedback or asks to improve/change ideas.
-3. **brainstorm** → Use if the user talks about specific themes, topics, or wants to go deeper into storytelling along with brainstorming.
-4. **generate-final-story** → Use if the user is ready for a final story/script based on ideas and already brainstormed topics.
-5. **generate-image** → Use if the user wants a visual or image based on the story.
 ---
 ### Rules:
-- If the query clearly maps to a tool, return the tool name and a relevant message.
-- If the query is unclear or irrelevant, set `tool` to `null` and return a helpful question in `message`.
-- Your output must ALWAYS be in JSON format like this:
 ### Output Format:
 "tool": "the exact name of the tool",
-"message": "Sure! Here are some creative campaign ideas based on your business."
-"""

 orchestration_prompt = """
+You are a perfect marketing guide and AI orchestration agent that reads the user's message and decides which one of the following tools should be called next. You're perfect at analyzing the intention of the user.
+Also you have to analyze that if any information of the image is provided as the input too. If any information of image is provided, just return that information simply.
+Your job is to analyze the **user's input** only **not the information of the image** and return a JSON object with:
 1. `tool`: the most appropriate tool name from the list below (or `null` if not applicable)
+2. `message`: a clear, helpful message to show to the user. This can be a question, guidance or even an action confirmation depending on the user query. You can guide the user according to their intention.
+3. 'image_caption' : Information of the image if provided, otherwise return a text of **No any information**.
 ---
 ### Available Tools:
 1. **ideation** → Use if the user wants to create marketing video ideas.
 2. **human-idea-refining** → Use if the user gives feedback or asks to improve/change ideas.
+3. **generate-story** → Use if the user talks about **creating the story** from their idea **OR** if the user talks about **creating story with brainstorming**.
+4. **generate-ultimate-story** → Use if the user is ready for a final or ultimate story/script based on ideas and already brainstormed topics from the previous tool called **generate-story**.
+                              Remember one thing, **generate-ultimate-story** is never invoked without invoking **generate-story**.
+5. **generate-image** → Use if the user wants a visual or image based on the ultimate story.
 ---
 ### Rules:
+- Only use the **user's message** for understanding the intent.
+- If the user is **asking about the image**, return the image information as the `message` and set `"tool": null`.
+- If the message **clearly maps to a tool**, return the tool name and a relevant message.
+- If the message is **unclear or not actionable**, set `tool` to `null` and return a helpful clarification question in `message`.
+- If there is no any provided  information of image, just interact with the user according to your job.
+---
 ### Output Format:
 "tool": "the exact name of the tool",
+"message": "Guidance to the business campaigns like asking questions, giving suggestions etc."
+"image_caption" : Information of the image if provided, otherwise return a text of **No any information**.
+"""
+def captioning_prompt(user_input):
+    return f'''
+Caption the image based on the user question if the user asks something about the image.
+If the user question is not relevant to the image provided, just caption the image and give the information provided in the image in just 50 words.
+The user input is:**{user_input}**
+'''

orchestration_agent/utils/state.py CHANGED Viewed

@@ -4,3 +4,4 @@ from pydantic import BaseModel, Field
 class ValidationFormatter(BaseModel):
   tool: str = Field(description="Returns the name of the tool.")
   message: str = Field(description="Returns the message or response of the user query.")

 class ValidationFormatter(BaseModel):
   tool: str = Field(description="Returns the name of the tool.")
   message: str = Field(description="Returns the message or response of the user query.")
+  image_caption: str = Field(description="Returns information of the image if provided. Otherwise returns null.")

orchestration_agent/utils/utils.py ADDED Viewed

	@@ -0,0 +1,38 @@

+import pandas as pd
+import ast
+from groq import Groq
+import os
+from .prompts import captioning_prompt
+def caption_image(image_base64,user_input):
+    if len(image_base64)>0:
+        print('Captioning image')
+        client = Groq(api_key=os.environ.get('GROQ_API_KEY'))
+        chat_completion = client.chat.completions.create(
+            messages=[
+                {
+                    "role": "user",
+                    "content": [
+                        {"type": "text", "text": captioning_prompt(user_input)},
+                        {
+                            "type": "image_url",
+                            "image_url": {
+                                "url": f"data:image/jpg;base64,{image_base64[-1]}",
+                            },
+                        },
+                    ],
+                }
+            ],
+            model="meta-llama/llama-4-scout-17b-16e-instruct",
+            max_completion_tokens=50,
+            temperature = 1
+        )
+        response=chat_completion.choices[0].message.content
+        return response
+    else:
+        return ''