Spaces:
Sleeping
Sleeping
samir72
committed on
Commit
·
586cbc6
1
Parent(s):
c96bf89
Prompts read from json file
Browse files- app.py +44 -4
- metadata.json +23 -0
app.py
CHANGED
|
@@ -6,6 +6,7 @@ from datetime import datetime
|
|
| 6 |
import gradio as gr
|
| 7 |
from dotenv import load_dotenv
|
| 8 |
from openai import AzureOpenAI # official OpenAI SDK, works with Azure endpoints
|
|
|
|
| 9 |
|
| 10 |
# --- LLM call (Azure OpenAI with API key) -----------------------------------
|
| 11 |
|
|
@@ -22,6 +23,7 @@ def summarize_audio_b64(audio_b64: str, sys_prompt: str, user_prompt: str) -> st
|
|
| 22 |
|
| 23 |
if not endpoint or not api_key or not deployment:
|
| 24 |
return "Server misconfiguration: required env vars missing."
|
|
|
|
| 25 |
|
| 26 |
try:
|
| 27 |
client = AzureOpenAI(
|
|
@@ -56,8 +58,30 @@ def summarize_audio_b64(audio_b64: str, sys_prompt: str, user_prompt: str) -> st
|
|
| 56 |
|
| 57 |
except Exception as ex:
|
| 58 |
return print(f"Error from Azure OpenAI: {ex}")
|
| 59 |
-
|
| 60 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 61 |
# --- I/O helpers ------------------------------------------------------------
|
| 62 |
|
| 63 |
def encode_audio_from_path(path: str) -> str:
|
|
@@ -120,15 +144,31 @@ with gr.Blocks(title="Audio Summarizer") as demo:
|
|
| 120 |
with gr.Column():
|
| 121 |
url_input = gr.Textbox(label="mp3 URL", placeholder="https://example.com/audio.mp3")
|
| 122 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 123 |
with gr.Row():
|
| 124 |
userprompt_input = gr.Textbox(
|
| 125 |
label="User Prompt",
|
| 126 |
-
value="Summarize the audio content",
|
|
|
|
| 127 |
placeholder="e.g., Extract key points and action items",
|
| 128 |
)
|
| 129 |
sysprompt_input = gr.Textbox(
|
| 130 |
label="System Prompt",
|
| 131 |
-
value="You are an AI assistant with a
|
|
|
|
| 132 |
)
|
| 133 |
|
| 134 |
submit_btn = gr.Button("Summarize")
|
|
|
|
| 6 |
import gradio as gr
|
| 7 |
from dotenv import load_dotenv
|
| 8 |
from openai import AzureOpenAI # official OpenAI SDK, works with Azure endpoints
|
| 9 |
+
import json
|
| 10 |
|
| 11 |
# --- LLM call (Azure OpenAI with API key) -----------------------------------
|
| 12 |
|
|
|
|
| 23 |
|
| 24 |
if not endpoint or not api_key or not deployment:
|
| 25 |
return "Server misconfiguration: required env vars missing."
|
| 26 |
+
|
| 27 |
|
| 28 |
try:
|
| 29 |
client = AzureOpenAI(
|
|
|
|
| 58 |
|
| 59 |
except Exception as ex:
|
| 60 |
return print(f"Error from Azure OpenAI: {ex}")
|
| 61 |
+
#pass
|
| 62 |
+
|
| 63 |
+
#----Retrieve meta data from metadata.json file------------------------------
|
| 64 |
+
def retrieve_file_path(file_name):
    """Return the absolute path of *file_name* located in the same
    directory as this script, or None when it cannot be used.

    Parameters
    ----------
    file_name : str
        Bare file name expected to sit next to this module
        (e.g. 'metadata.json').

    Returns
    -------
    str | None
        The absolute path if it is an existing regular file,
        otherwise None (a diagnostic is printed).
    """
    base_dir = os.path.dirname(os.path.abspath(__file__))
    file_path = os.path.join(base_dir, file_name)
    if os.path.isfile(file_path):
        return file_path
    if not os.path.exists(file_path):
        print(f"'{file_path}' does not exist.")
    else:
        # Path exists but is not a regular file (e.g. a directory).
        # The original code silently returned None here, hiding the
        # misconfiguration from the operator.
        print(f"'{file_path}' is not a regular file.")
    return None
|
| 73 |
+
|
| 74 |
+
def retrieve_json_record(file_path, record_id):
    """Load JSON from *file_path* and return the record whose
    metadata id matches *record_id*.

    The payload may be either a single record (dict) or a list of
    records; each record is expected to carry its identifier under
    record['metadata']['id'].

    Parameters
    ----------
    file_path : str
        Path to a JSON file.
    record_id : str
        Identifier to match against record['metadata']['id'].

    Returns
    -------
    dict | None
        The matching record, or None if no record matches.

    Raises
    ------
    OSError, json.JSONDecodeError
        Propagated unchanged from opening/parsing the file.
    """
    # Pin the encoding so parsing does not depend on the platform's
    # default locale encoding.
    with open(file_path, 'r', encoding='utf-8') as file:
        data = json.load(file)
    # Normalise to a list so the single-dict and list-of-dicts cases
    # share one lookup path (the original duplicated the comparison).
    if isinstance(data, list):
        records = data
    elif isinstance(data, dict):
        records = [data]
    else:
        records = []
    for record in records:
        # Guard against non-dict list entries, which would have raised
        # AttributeError on .get() in the original.
        if isinstance(record, dict) and record.get('metadata', {}).get('id') == record_id:
            return record
    return None
|
| 85 |
# --- I/O helpers ------------------------------------------------------------
|
| 86 |
|
| 87 |
def encode_audio_from_path(path: str) -> str:
|
|
|
|
| 144 |
with gr.Column():
|
| 145 |
url_input = gr.Textbox(label="mp3 URL", placeholder="https://example.com/audio.mp3")
|
| 146 |
|
| 147 |
+
### Get system and user prompts from metadata.json file
file_name = 'metadata.json'
record_id = '1'

# Fallback prompts (the values this commit replaced) so the UI still
# renders when the metadata file or the record is missing.  Without
# these, jsonrecord=None crashed the subscript lookups below with a
# TypeError right after printing "Record not found.".
userprompt_default = "Summarize the audio content"
sysprompt_default = (
    "You are an AI assistant with a charter to clearly analyze the "
    "customer enquiry."
)

file_path = retrieve_file_path(file_name)
# retrieve_file_path returns None when the file is absent; skip the
# JSON lookup entirely in that case instead of passing None to open().
jsonrecord = retrieve_json_record(file_path, record_id) if file_path else None
if jsonrecord:
    print(json.dumps(jsonrecord, indent=2))
    content = jsonrecord.get('metadata', {}).get('content', {})
    # Only override the fallbacks when the record actually carries
    # the expected prompt fields.
    sysprompt_default = content.get('system_prompt', {}).get('content', sysprompt_default)
    userprompt_default = content.get('user_prompt', {}).get('content', userprompt_default)
else:
    print("Record not found.")
|
| 160 |
+
|
| 161 |
with gr.Row():
|
| 162 |
userprompt_input = gr.Textbox(
|
| 163 |
label="User Prompt",
|
| 164 |
+
#value="Summarize the audio content",
|
| 165 |
+
value=userprompt_default,
|
| 166 |
placeholder="e.g., Extract key points and action items",
|
| 167 |
)
|
| 168 |
sysprompt_input = gr.Textbox(
|
| 169 |
label="System Prompt",
|
| 170 |
+
#value="You are an AI assistant with a charter to clearly analyze the customer enquiry.",
|
| 171 |
+
value=sysprompt_default,
|
| 172 |
)
|
| 173 |
|
| 174 |
submit_btn = gr.Button("Summarize")
|
metadata.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"metadata": {
|
| 3 |
+
"id": "1",
|
| 4 |
+
"timestamp": "2025-09-18T11:24:00Z",
|
| 5 |
+
"type": "prompt_metadata",
|
| 6 |
+
"content": {
|
| 7 |
+
"system_prompt": {
|
| 8 |
+
"title": "System Prompt",
|
| 9 |
+
"content": "You are a highly capable AI assistant designed to process and analyze multimodal inputs, including text and images. Your task is to generate a structured response based on the provided input, following a specific format. When an image is uploaded along with a text prompt, analyze the image content and integrate it with the text to produce a coherent response. Use the following format for your response: - **Summary**: Provide a concise summary of the main points from the text and image (if applicable), limited to 2-3 sentences. - **Key Details**: List 3-5 key details extracted from the text and image, presented as bullet points. - **Insights**: Offer 1-2 insightful observations or conclusions based on the content, keeping it brief. Ensure your response is accurate, relevant, and tailored to the input. If the input lacks sufficient information, acknowledge the limitation and provide a general response based on the available data.",
|
| 10 |
+
"version": "1.0",
|
| 11 |
+
"created_at": "2025-09-18T11:00:00Z"
|
| 12 |
+
},
|
| 13 |
+
"user_prompt": {
|
| 14 |
+
"title": "User Prompt",
|
| 15 |
+
"content": "Analyze the attached image and the following text to provide a structured response. Make sure to include a summary, key details, and insights based on the combined information.",
|
| 16 |
+
"version": "1.0",
|
| 17 |
+
"created_at": "2025-09-18T11:10:00Z"
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"tags": ["AI", "multimodal", "podcast", "AWS"],
|
| 21 |
+
"status": "active"
|
| 22 |
+
}
|
| 23 |
+
}
|