Spaces:

varun-d-gl
/

Recording-QC-Bot

Sleeping

App Files Files Community

varund2003 committed on Jun 8, 2025

Commit

d8fd28f

0 Parent(s):

Initial project commit

Browse files

Files changed (35) hide show

.env +3 -0
Dockerfile +25 -0
app.py +202 -0
client_secret_522138295664-m3olkqmmocd1h1iqdh5rlgqhl9p6t5mo.apps.googleusercontent.com.json +1 -0
config/checklist.txt +41 -0
config/config.json +12 -0
credentials.json +13 -0
mentor_materials/Agent SDK_V1_24-04-25.txt +53 -0
mentor_materials/Agent_SDK_+_Google_SDK.txt +214 -0
qc_bot.log +238 -0
reports/report_Overview and Key Components of Agent SDK.txt +53 -0
reports/report_Use case of Agent SDK.txt +51 -0
reports/report_Working of Agent SDK.txt +39 -0
requirements.txt +11 -0
src/__init__.py +0 -0
src/__pycache__/__init__.cpython-312.pyc +0 -0
src/__pycache__/main_flow.cpython-312.pyc +0 -0
src/main_flow.py +195 -0
src/preprocessing/__pycache__/download_manager.cpython-312.pyc +0 -0
src/preprocessing/__pycache__/file_processor.cpython-312.pyc +0 -0
src/preprocessing/__pycache__/gdrive_manager.cpython-312.pyc +0 -0
src/preprocessing/__pycache__/transcript_generator.cpython-312.pyc +0 -0
src/preprocessing/__pycache__/video_processor.cpython-312.pyc +0 -0
src/preprocessing/download_manager.py +42 -0
src/preprocessing/file_processor.py +52 -0
src/preprocessing/gdrive_manager.py +93 -0
src/preprocessing/transcript_generator.py +87 -0
src/preprocessing/video_processor.py +51 -0
src/report_generation/__pycache__/openai_client.cpython-312.pyc +0 -0
src/report_generation/__pycache__/report_generator.cpython-312.pyc +0 -0
src/report_generation/openai_client.py +25 -0
src/report_generation/report_generator.py +120 -0
transcripts/Overview and Key Components of Agent SDK.txt +6 -0
transcripts/Use case of Agent SDK.txt +16 -0
transcripts/Working of Agent SDK.txt +3 -0

.env ADDED Viewed

	@@ -0,0 +1,3 @@

+AZURE_SPEECH_KEY=FTm8MJblCZB02npRwB8dR8no2qSBNc8waZymfSxhI9NRQNpTfzBZJQQJ99BCACYeBjFXJ3w3AAAAACOGjJxh
+AZURE_SPEECH_REGION=eastus
+AZURE_OPENAI_KEY=6LKxP1xM2wbfXSOEsnmiTBW63yMGO1W08KFBhuuNd2KQGZSic5DlJQQJ99BCACHYHv6XJ3w3AAAAACOGrHz4

Dockerfile ADDED Viewed

	@@ -0,0 +1,25 @@

+FROM python:3.9-slim
+WORKDIR /app
+# Install system dependencies
+RUN apt-get update && \
+    apt-get install -y ffmpeg && \
+    rm -rf /var/lib/apt/lists/*
+# Install Python dependencies first so this layer stays cached until
+# requirements.txt itself changes
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+# Copy application files
+COPY . .
+# AZURE_SPEECH_KEY, AZURE_SPEECH_REGION and AZURE_OPENAI_KEY must be supplied
+# at run time (e.g. `docker run -e NAME=value` or the hosting platform's
+# secrets). They are deliberately not set with ENV here: without a matching
+# ARG, `ENV NAME=$NAME` expands to an empty string at build time, and
+# load_dotenv() in app.py does not override variables that already exist.
+# Expose port
+EXPOSE 8501
+# Run the application
+CMD ["streamlit", "run", "app.py", "--server.port=8501", "--server.address=0.0.0.0"]

app.py ADDED Viewed

	@@ -0,0 +1,202 @@

+# app.py
+import streamlit as st
+import os
+import asyncio
+import logging
+import time
+from src.preprocessing.gdrive_manager import GoogleDriveManager
+from src.main_flow import MainFlow
+from dotenv import load_dotenv
+# Configure logging
+# Records go to qc_bot.log (append mode, UTF-8) and to the console stream.
+logging.basicConfig(
+    level=logging.INFO,
+    format="%(asctime)s %(levelname)s %(name)s: %(message)s",
+    handlers=[
+        logging.FileHandler("qc_bot.log", mode='a', encoding='utf-8'),
+        logging.StreamHandler()
+    ]
+)
+logger = logging.getLogger(__name__)
+# Load environment variables
+load_dotenv()
+# Initialize MainFlow
+# NOTE(review): this runs at module level, so a new MainFlow is built every
+# time Streamlit re-executes the script; qc_bot.log shows repeated
+# "Initializing MainFlow" entries. Confirm whether that is intended.
+main_flow = MainFlow("config/config.json")
+# Streamlit UI
+st.set_page_config(
+    page_title="QC Report Generator",
+    page_icon="📊",
+    layout="wide"
+)
+# Custom CSS
+st.markdown("""
+    <style>
+    .stButton>button {
+        background-color: #4CAF50;
+        color: white;
+        font-weight: bold;
+        padding: 10px 24px;
+        border-radius: 5px;
+    }
+    .report-box {
+        border: 1px solid #e0e0e0;
+        border-radius: 10px;
+        padding: 20px;
+        margin: 10px 0;
+        background-color: #f9f9f9;
+    }
+    .success-banner {
+        background-color: #d4edda;
+        color: #155724;
+        padding: 15px;
+        border-radius: 5px;
+        margin: 20px 0;
+        text-align: center;
+    }
+    .warning-banner {
+        background-color: #fff3cd;
+        color: #856404;
+        padding: 15px;
+        border-radius: 5px;
+        margin: 20px 0;
+    }
+    </style>
+""", unsafe_allow_html=True)
+# Initialize session state
+if 'processing' not in st.session_state:
+    st.session_state.processing = False
+if 'reports_generated' not in st.session_state:
+    st.session_state.reports_generated = False
+if 'video_type' not in st.session_state:
+    st.session_state.video_type = "conceptual"
+# App header
+st.title("📊 QC Report Generator")
+st.subheader("Automated Quality Control for Training Videos")
+# Configuration Section
+# Collects the video type, the Drive folder URL and the optional mentor files,
+# then flags the session for processing when the button is pressed.
+with st.expander("⚙️ Configuration", expanded=True):
+    st.session_state.video_type = st.radio(
+        "Select Video Type:",
+        ["conceptual", "hands-on", "both"],
+        # Maps the stored option value to the label shown in the UI.
+        format_func=lambda x: {
+            "conceptual": "Conceptual Explanation",
+            "hands-on": "Hands-on Demonstration",
+            "both": "Both"
+        }[x]
+    )
+    drive_url = st.text_input(
+        "Google Drive Videos Folder URL:",
+        placeholder="https://drive.google.com/drive/folders/1KSdVSVs_yN6FHvzH0i0CW2wNI0tCPhGt",
+        help="URL of the folder containing videos"
+    )
+    # Only the uploaders relevant to the chosen video type are rendered;
+    # "both" renders the slides uploader and the notebook uploader.
+    mentor_files = {}
+    if st.session_state.video_type in ["conceptual", "both"]:
+        mentor_files["slides"] = st.file_uploader(
+            "Upload Presentation (PPTX):",
+            type=["pptx", "ppt"]
+        )
+    if st.session_state.video_type in ["hands-on", "both"]:
+        mentor_files["notebook"] = st.file_uploader(
+            "Upload Notebook (IPYNB):",
+            type=["ipynb"]
+        )
+    # The button is disabled while a run is in progress.
+    if st.button("Generate Reports", disabled=st.session_state.processing):
+        if not drive_url:
+            st.error("Please enter a Google Drive URL")
+        else:
+            # Start a new run and hide any reports from a previous one.
+            st.session_state.processing = True
+            st.session_state.reports_generated = False
+# Processing
+if st.session_state.processing:
+    status_area = st.empty()
+    progress_bar = st.progress(0)
+    # Processing steps
+    steps = [
+        "Downloading videos from Google Drive",
+        "Processing mentor materials",
+        "Generating transcripts",
+        "Creating quality reports"
+    ]
+    for i, step in enumerate(steps):
+        progress = int((i + 1) * 25)
+        status_area.info(f"⏳ **Step {i+1}/4**: {step}")
+        progress_bar.progress(progress)
+        try:
+            if i == 0:
+                # Process mentor materials FIRST
+                main_flow.process_mentor_materials(mentor_files)
+            elif i == 1:
+                # Download and process videos
+                asyncio.run(main_flow.process_drive_url(drive_url))
+            elif i == 2:
+                # Transcripts generated automatically
+                pass
+            elif i == 3:
+                # Generate reports
+                main_flow.generate_quality_reports()
+        except Exception as e:
+            status_area.error(f"❌ Error in step {i+1}: {str(e)}")
+            st.session_state.processing = False
+            st.stop()
+        time.sleep(1)  # Simulate processing time
+    status_area.success("✅ Processing completed!")
+    st.session_state.processing = False
+    st.session_state.reports_generated = True
+    st.balloons()
+# Sync reports from Google Drive
+def sync_reports_from_drive(main_flow):
+    gdrive = GoogleDriveManager()
+    report_drive_files = gdrive.list_txt_files(main_flow.drive_folders["REPORTS"])
+    for file in report_drive_files:
+        local_path = os.path.join(main_flow.paths["REPORTS"], file["name"])
+        if not os.path.exists(local_path):
+            gdrive.download_file(file["id"], local_path)
+# Display Reports
+if st.session_state.reports_generated:
+    # Sync reports before displaying
+    sync_reports_from_drive(main_flow)
+    st.divider()
+    st.subheader("📋 Generated Reports")
+    reports_dir = main_flow.paths["REPORTS"]
+    report_files = [f for f in os.listdir(reports_dir) if f.endswith(".txt")]
+    if report_files:
+        for report_file in report_files:
+            with st.expander(f"📝 {report_file.replace('report_', '').replace('.txt', '')}"):
+                try:
+                    with open(os.path.join(reports_dir, report_file), "r", encoding="utf-8") as f:
+                        report_content = f.read()
+                    # Display report with formatting
+                    st.markdown(report_content)
+                    # Download button
+                    st.download_button(
+                        label=f"Download {report_file}",
+                        data=report_content,
+                        file_name=report_file,
+                        mime="text/plain",
+                        key=f"dl_{report_file}"
+                    )
+                except Exception as e:
+                    st.error(f"Error reading report: {str(e)}")
+    else:
+        st.info("No reports found. Please generate reports first.")

client_secret_522138295664-m3olkqmmocd1h1iqdh5rlgqhl9p6t5mo.apps.googleusercontent.com.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"web":{"client_id":"522138295664-m3olkqmmocd1h1iqdh5rlgqhl9p6t5mo.apps.googleusercontent.com","project_id":"neon-net-462111-k2","auth_uri":"https://accounts.google.com/o/oauth2/auth","token_uri":"https://oauth2.googleapis.com/token","auth_provider_x509_cert_url":"https://www.googleapis.com/oauth2/v1/certs","client_secret":"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"}}

config/checklist.txt ADDED Viewed

	@@ -0,0 +1,41 @@

+AO Checklist
+-------------
+1. Content Accuracy & Coverage:
+   a. Topic and Subtopic Coverage: Confirm that all planned topics and subtopics are mentioned and explained.
+   b. Logical and Sequential Explanation: Ensure concepts are introduced in a structured, progressive order.
+   c. Factual Accuracy: Verify all statements are technically correct without conceptual inaccuracies.
+   d. Use of Examples and Analogies: Check for relevant examples/analogies for complex concepts.
+2. Code Walkthrough & Demonstration (if applicable):
+   a. Clear Execution of Code Demos: Code demonstrations should be clearly explained through narration.
+   b. Complete Explanation of Code Components: Variables, functions, and logic blocks should be described.
+   c. Mention of Libraries/Tools: All libraries/frameworks used should be explicitly named and explained.
+   d. Output Validation: Expected code outputs should be described and discussed.
+   e. Demonstration Pacing: Hands-on activities should be taught at a followable pace.
+3. Speech Clarity & Language Quality:
+   a. Clear and Understandable Speech: Speech should be coherent and paced appropriately.
+   b. Minimized Use of Filler Words: Avoid frequent fillers like "umm", "uh", "hmm", "ah".
+   c. Pronunciation of Technical Terms: Technical terms should be pronounced clearly.
+   d. Professional Language: Language must be formal, academic, and respectful.
+   e. No Inappropriate/Biased Statements: Avoid insensitive or biased language.
+4. Alignment with Visual Content:
+   a. Narration Matches Slide Order: Spoken content should follow the slide sequence.
+5. Student Engagement Prompts:
+   a. Calls to Action or Pause for Reflection: Prompt learners to try things themselves.
+   b. Questions to Learners: Include rhetorical questions to engage learners.
+   c. Invites Feedback or Queries: Encourage questions through comments/forums.
+6. Session Structure & Flow:
+   a. Proper Opening/Greeting: Start with clear introduction setting context.
+   b. Clear Transitions Between Sections: Use verbal cues for topic shifts.
+7. Tone, Motivation & Inclusivity:
+   a. Encouraging and Positive Tone: Use motivational language.
+   b. Inclusive Language: Gender-neutral and inclusive of all backgrounds.
+8. Time Management Indicators:
+   a. Adherence to Time Markers: Actual pacing should match mentioned time estimates.

config/config.json ADDED Viewed

	@@ -0,0 +1,12 @@

+{
+  "PATHS": {
+    "VIDEOS": "videos",
+    "AUDIOS": "audios",
+    "TRANSCRIPTS": "transcripts",
+    "REPORTS": "reports",
+    "MENTOR_MATERIALS": "mentor_materials"
+  },
+  "AZURE_OPENAI_ENDPOINT": "https://tst123451307193883.openai.azure.com/",
+  "AZURE_OPENAI_APIVERSION": "2025-01-01-preview",
+  "CHATGPT_MODEL": "gpt-4o-mini"
+}

credentials.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "type": "service_account",
+  "project_id": "neon-net-462111-k2",
+  "private_key_id": "cc77a1185d7e0467ebe7072a971932f286f2f0be",
+  "private_key": "-----BEGIN PRIVATE KEY-----\nMIIEvQIBADANBgkqhkiG9w0BAQEFAASCBKcwggSjAgEAAoIBAQC0rgQBpIK2+SSG\njAXPJJZHfPuPVBTcLxnh6atAo0dUmNPCYEvUkUlSZi/HhZm0Bomn7ALi9+pC04bV\nU5ha1vCqlM73QDFSnPXTuL4kB1IG656VVv+DEFT+nqMwUxnTH8a742TrTB5i+YhO\n49GtQpGljgS0fRl8kYUClEZygbq5PiYScI2fM8aZCMYtqx+9qlrY5KXGHKz2sH1S\nFUoStHIxkI2UHPmG+j6z8y+8lQbZrrmE5QBrfuksFd/O3rI9qX0al7qQOv+UDFRM\ncFZKoG3kGyCVV1ZqCLiK5N8E3I3l41GaozEUZd1fBxyujaD/Q00a/91EdbaRXbO3\nEX6bWjoDAgMBAAECggEACew0oOwQy01LfQgoZlCzRog0Pvh2XNFJZQEyooFVFyEX\nIBzhwHIDynHj1du3rg3EQzCdYZGnKYLGBbLQy/+NIBEkFkTncIrZa7mnPgGyg40u\ntgAdI2y8l9WZtYga0JMO+wQ2AQyHiEmXLtEo+fbzjYzX8IGeULUKAcynqDCi7JSU\nv1scypeODrm5wO2+KwEZ4s0Wby1mXDgYcbG3Gnq3FVv8p/VEBhs/R9wBC9iJdICm\nKyHW36iSfanKJtCKV2IBjOKkqz2YcCtnpaD/07Zo4zy1tBZMicUeAod4J/yAMiOZ\nAtFHVc223JzsZupkpnwtdVCpdpTB4vw81LBF5olEIQKBgQDgcNZz6IL2ABtzGE+b\ncOQ6WQBBFY9yOO4CQ+RBG5HNQ8/HYk1Uvg0OP/KrbqDfEv8rC4EyxWZmoX7ibpMY\nmgAA4MBpLDalXB8K8PV5lzh4uye6YV9kyKgkg979vnxs9Q5cX1oa+7qG1hx8zbZu\nzsL8FqaS/6vTYGrixdqI3phklQKBgQDOFessthjXbx6uVdzcgEPQ5rq13oo31oIF\nXpxLaZsM8H5XLwAC40RSFq1u3QFgt69PRapyNx7Jc88qK+zVcsJI7DawKyAHh19j\nHfr1LLtVJkbOj4XeZIurGQMvcH4o49Dr5g4KROvCmJRnRdAOrWXrDpxoMiM/GwEN\n/RXi/NSmNwKBgHeejB2wkYPtILQiA+OzsmAKqWEGzbIx92BLsO6mc/nzp1z73n1I\n4YpzuLF3v9PEuyzE7/IQVXhjoE2sY0ecZF4Ta1likClnxL+/FwXb++QU06K5XO9J\nJpx3kDSq/oPPw/ylcU+qVIqiuQInXZEHL9LNe7AjBgAdhjog+00xXgVVAoGBAJIL\nEGTYCtSox3pOGL0eHHDvAYOe2B5n4i5B9MqwZROPXkkUYpKpUaJGtdMpxS8wHIk1\n2mskSqoCat380NIWiD47Pyoq9YDAW0WXWl/iukLGZEk/hmOqpxuyFwLIWm9JuqVh\nm7OFUfnOPOTOoXm1QdOIwChK15WB4oZyQs9f0qaTAoGAPKQrkVItvZA/7GLo4uPx\ngICeL+/D8n/BslfF9/XR4++0TKDv1uZM004SCMpUoIoklhxmVxi+aQeA/0VbDID5\nMjQst7QYQ4eaa7znvG3XFN9i96iU2sKAIb4ufITyC3XTxE5sH8b3w03uEhgil/GV\n4GZP+m8IcqsEr5koc/Jdq9k=\n-----END PRIVATE KEY-----\n",
+  "client_email": "recording-qc-bot@neon-net-462111-k2.iam.gserviceaccount.com",
+  "client_id": "103182639505940473738",
+  "auth_uri": "https://accounts.google.com/o/oauth2/auth",
+  "token_uri": "https://oauth2.googleapis.com/token",
+  "auth_provider_x509_cert_url": "https://www.googleapis.com/oauth2/v1/certs",
+  "client_x509_cert_url": "https://www.googleapis.com/robot/v1/metadata/x509/recording-qc-bot%40neon-net-462111-k2.iam.gserviceaccount.com",
+  "universe_domain": "googleapis.com"
+}

mentor_materials/Agent SDK_V1_24-04-25.txt ADDED Viewed

	@@ -0,0 +1,53 @@

+=== Slide 1 ===
+Agent SDK
+=== Slide 2 ===
+Agenda
+In this session, we'll discuss: Introduction to Agent SDK Key Components of Agent SDK Working of Agent SDK Use Cases of Agent SDK Benefits and Challenges of Agent SDK
+=== Slide 3 ===
+Introduction to Agent SDK
+=== Slide 4 ===
+Introduction to Agent SDK
+Toolkit for building autonomous AI agents Provides resources, tools, and libraries Helps create flexible and reusable AI systems Enables integration of goals, tools, and memory in agents
+What is Agent SDK?
+=== Slide 5 ===
+Key Components of Agent SDK
+=== Slide 6 ===
+Key Components of Agent SDK
+Goals
+Tools
+Memory
+Reasoning Loops
+=== Slide 7 ===
+Working of Agent SDK
+=== Slide 8 ===
+Working of Agent SDK
+Prompt
+Tool
+Action
+Result
+=== Slide 9 ===
+Use Cases of Agent SDK
+=== Slide 10 ===
+Benefits and Challenges of Agent SDK
+=== Slide 11 ===
+Benefits of using Agent SDK
+=== Slide 12 ===
+Challenges in using Agent SDK
+=== Slide 13 ===
+Summary
+Let's quickly recap: Agent SDK is a framework that helps create autonomous agents capable of performing tasks and interacting with external services. Key components include goals (objectives), memory (stores data), tools (external resources), and a reasoning loop (logic to decide actions). It allows agents to store information, interact with tools, and make decisions to achieve their goals autonomously. Agent SDK provides autonomy, modularity, and flexibility in task automation. Challenges include complex integration and debugging. Additionally, managing external resources can be difficult.
+=== Slide 14 ===
+Thank You

mentor_materials/Agent_SDK_+_Google_SDK.txt ADDED Viewed

	@@ -0,0 +1,214 @@

+## MARKDOWN CELL ##
+Problem Statement:
+Building an AI Agent Using Google SDK to Automate Real-Time Web Search Tasks
+Objective:
+Develop a simple autonomous AI Agent that takes a user-defined goal, performs real-time web searches using the Google Custom Search API (Google SDK), and presents relevant results to the user. The agent should also retain memory of past goals and results for reference.
+----
+## MARKDOWN CELL ##
+Key Features:
+* Accept a user-defined goal (search query).
+* Use Google Custom Search API to fetch top search results.
+* Display the top 3 results including title, URL, and snippet.
+* Store the goal and results in memory for future use.
+* Provide an option to refine the goal manually or conclude the session.
+----
+## MARKDOWN CELL ##
+Expected Outcome:
+* A functional, interactive AI Agent that demonstrates
+ Goal → Tool → Action → Result
+* Real-time search result delivery based on user inputs.
+* A memory system that logs all goals and search outcomes during the session.
+----
+## CODE CELL ##
+# === Install the required package ===
+!pip install google-api-python-client
+# === Import necessary modules ===
+from googleapiclient.discovery import build
+# === API Configuration ===
+# === Memory to store past goals and results ===
+memory = []
+# === Define the tool function using Google SDK ===
+def google_search(query):
+    print(f"\n[Tool] Searching Google for: '{query}'")
+    service = build("customsearch", "v1", developerKey=API_KEY)
+    res = service.cse().list(q=query, cx=SEARCH_ENGINE_ID).execute()
+    return res['items']
+# === Define the AI Agent's Reasoning Loop ===
+def agent_reasoning_loop(goal):
+    print(f"\n[Agent] Received Goal: '{goal}'")
+    # Use Google Search Tool
+    results = google_search(goal)
+    # Display Top 3 Results
+    print(f"\n[Agent] Top 3 Results for '{goal}':\n")
+    for idx, item in enumerate(results[:3]):
+        print(f"Result {idx+1}:")
+        print("Title:", item['title'])
+        print("URL:", item['link'])
+        print("Snippet:", item['snippet'])
+        print("-" * 50)
+    # Store in Memory
+    memory.append({'goal': goal, 'results': results[:3]})
+    print(f"\n[Memory] Stored Goal & Results. Total stored goals: {len(memory)}")
+# === Real-Time Interaction ===
+# Greets the user, reads one search goal from standard input and runs the
+# agent on it.
+print("Welcome to AI Agent + Google SDK!")
+# Take user input for search goal
+user_goal = input("Enter your search goal (e.g., 'top AI research labs in 2025'): ")
+# Run the reasoning loop with the user's goal
+agent_reasoning_loop(user_goal)
+# === Show all memory at the end ===
+# Prints each stored goal followed by the title and link of its saved results.
+print("\n=== Final Memory Log ===")
+for m in memory:
+    print(f"\nGoal: {m['goal']}")
+    for r in m['results']:
+        print(f" - {r['title']} ({r['link']})")
+----
+## MARKDOWN CELL ##
+Constraints:
+* The agent operates only with manual refinement (no AI-generated refinements).
+* Search is limited to what the Google Custom Search API can return within quota limits.
+----
+## MARKDOWN CELL ##
+Enhancements:
+* Let GPT also summarize the search results.
+* Automatically generate next questions based on the results.
+* Add multi-turn conversations where GPT acts as a guide.
+----
+## MARKDOWN CELL ##
+Old Constraint:
+* Manual refinement needed after each search.
+Now:
+* GPT automatically refines queries based on the original goal.
+The agent becomes self-sufficient:
+* It thinks (refines),
+* Acts (searches),
+* Learns (stores memory).
+----
+## MARKDOWN CELL ##
+Flow of Execution:
+* Agent receives goal → e.g., "top AI research labs in 2025".
+* Searches Google using that goal.
+* Refines goal using GPT → e.g., "leading artificial intelligence research institutes worldwide 2025".
+* Searches Google again using GPT-refined goal.
+* Stores both goals and results in memory.
+----
+## CODE CELL ##
+# === Imports ===
+import openai
+from googleapiclient.discovery import build
+# === API Keys ===
+API_KEY = 'AIzaSyDZGmR6WcCU61cxpwSq70-jnJcOeh9PHHI'  # <-- Replace with your API Key
+SEARCH_ENGINE_ID = 'd16ee106ddcee4931'  # <-- Replace with your Search Engine ID
+openai.api_key = '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'  # <-- Replace this
+# === Memory Store ===
+memory = []
+# === Tool 1: Google Search ===
+def google_search(query):
+    print(f"\n[Tool] Searching Google for: '{query}'")
+    service = build("customsearch", "v1", developerKey=API_KEY)
+    res = service.cse().list(q=query, cx=SEARCH_ENGINE_ID).execute()
+    return res['items']
+# === Tool 2: OpenAI GPT for Refinement (Updated Syntax) ===
+def refine_query_with_gpt(original_query):
+    print(f"\n[GPT] Refining query for: '{original_query}'")
+    prompt = f"Suggest a more detailed and specific version of this search query: '{original_query}'"
+    response = openai.chat.completions.create(
+        model="gpt-3.5-turbo",  # or "gpt-4"
+        messages=[{"role": "user", "content": prompt}],
+        temperature=0.7,
+        max_tokens=50
+    )
+    refined_query = response.choices[0].message.content.strip()
+    print(f"[GPT] Refined Query: '{refined_query}'")
+    return refined_query
+# === AI Agent's Reasoning Loop ===
+def agent_reasoning_loop(goal):
+    print(f"\n[Agent] Received Goal: '{goal}'")
+    # First search with original goal
+    results_original = google_search(goal)
+    # Display Top 3 Results (Original)
+    print(f"\n[Agent] Top 3 Results for Original Goal '{goal}':\n")
+    for idx, item in enumerate(results_original[:3]):
+        print(f"Result {idx+1}:")
+        print("Title:", item['title'])
+        print("URL:", item['link'])
+        print("Snippet:", item['snippet'])
+        print("-" * 50)
+    # Refine goal using GPT
+    refined_goal = refine_query_with_gpt(goal)
+    results_refined = google_search(refined_goal)
+    # Display Top 3 Results (Refined)
+    print(f"\n[Agent] Top 3 Results for Refined Goal '{refined_goal}':\n")
+    for idx, item in enumerate(results_refined[:3]):
+        print(f"Result {idx+1}:")
+        print("Title:", item['title'])
+        print("URL:", item['link'])
+        print("Snippet:", item['snippet'])
+        print("-" * 50)
+    # Store both in memory
+    memory.append({
+        'original_goal': goal,
+        'refined_goal': refined_goal,
+        'results_original': results_original[:3],
+        'results_refined': results_refined[:3]
+    })
+    print(f"\n[Memory] Stored Original & Refined Goals. Total stored: {len(memory)}")
+# === Run Agent with User Input ===
+# Greets the user, reads one search goal from standard input and runs the
+# agent on it.
+print("Welcome to AI Agent with OpenAI GPT + Google SDK!")
+# Get the user goal via input
+user_goal = input("Enter your search goal (e.g., 'latest AI trends 2025'): ")
+# Run the reasoning loop with the user's goal
+agent_reasoning_loop(user_goal)
+# === Show Memory Log ===
+# Prints both goals of each record; only the refined-search results are
+# listed (title and link).
+print("\n=== Final Memory Log ===")
+for m in memory:
+    print(f"\nOriginal Goal: {m['original_goal']}")
+    print(f"Refined Goal: {m['refined_goal']}")
+    for r in m['results_refined']:
+        print(f" - {r['title']} ({r['link']})")
+----

qc_bot.log ADDED Viewed

	@@ -0,0 +1,238 @@

+2025-06-08 17:26:41,288 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:26:41,290 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:26:44,499 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:27:04,776 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:27:15,608 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:27:20,379 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:27:22,838 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:27:22,860 INFO src.main_flow: Processing Google Drive folder: https://drive.google.com/drive/folders/1angHYyiE_sPTKpRsrHyPAJkYF7b78iPf?usp=sharing
+2025-06-08 17:27:23,105 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 17:27:24,017 INFO src.preprocessing.gdrive_manager: Downloading file 1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR to videos\Use case of Agent SDK.mp4
+2025-06-08 17:27:30,436 INFO src.preprocessing.gdrive_manager: Download 13%
+2025-06-08 17:27:36,502 INFO src.preprocessing.gdrive_manager: Download 27%
+2025-06-08 17:27:42,513 INFO src.preprocessing.gdrive_manager: Download 41%
+2025-06-08 17:27:48,578 INFO src.preprocessing.gdrive_manager: Download 54%
+2025-06-08 17:27:54,620 INFO src.preprocessing.gdrive_manager: Download 68%
+2025-06-08 17:28:00,367 INFO src.preprocessing.gdrive_manager: Download 82%
+2025-06-08 17:28:06,293 INFO src.preprocessing.gdrive_manager: Download 96%
+2025-06-08 17:28:09,762 INFO src.preprocessing.gdrive_manager: Download 100%
+2025-06-08 17:28:09,762 INFO src.preprocessing.gdrive_manager: Download complete: videos\Use case of Agent SDK.mp4
+2025-06-08 17:28:09,764 INFO src.preprocessing.download_manager: Downloaded: Use case of Agent SDK.mp4
+2025-06-08 17:28:09,764 INFO src.main_flow: Processing video: Use case of Agent SDK.mp4
+2025-06-08 17:28:13,704 INFO src.main_flow: Converted video to audio: audios\Use case of Agent SDK.wav
+2025-06-08 17:28:18,268 INFO src.preprocessing.gdrive_manager: Uploaded audios\Use case of Agent SDK.wav to Drive folder 1bLbSXaO3AS-EuBg_o7sGc8AonkHt7SdG
+2025-06-08 17:28:18,830 WARNING googleapiclient.http: Encountered 403 Forbidden with reason "insufficientFilePermissions"
+2025-06-08 17:28:18,831 ERROR src.preprocessing.gdrive_manager: An error occurred: <HttpError 403 when requesting https://www.googleapis.com/drive/v3/files/1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR? returned "The user does not have sufficient permissions for this file.". Details: "[{'message': 'The user does not have sufficient permissions for this file.', 'domain': 'global', 'reason': 'insufficientFilePermissions'}]">
+2025-06-08 17:37:02,253 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:37:15,378 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:37:16,444 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:37:20,983 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:37:24,543 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:37:25,943 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:37:25,970 INFO src.main_flow: Processing Google Drive folder: https://drive.google.com/drive/folders/1angHYyiE_sPTKpRsrHyPAJkYF7b78iPf
+2025-06-08 17:37:26,192 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 17:37:27,055 INFO src.preprocessing.gdrive_manager: Downloading file 1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR to videos\Use case of Agent SDK.mp4
+2025-06-08 17:37:34,060 INFO src.preprocessing.gdrive_manager: Download 13%
+2025-06-08 17:37:41,520 INFO src.preprocessing.gdrive_manager: Download 27%
+2025-06-08 17:37:48,595 INFO src.preprocessing.gdrive_manager: Download 41%
+2025-06-08 17:37:54,638 INFO src.preprocessing.gdrive_manager: Download 54%
+2025-06-08 17:38:29,171 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:38:50,946 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:38:54,122 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:38:58,463 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:39:04,578 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:39:06,168 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 17:39:06,193 INFO src.main_flow: Processing Google Drive folder: https://drive.google.com/drive/folders/1angHYyiE_sPTKpRsrHyPAJkYF7b78iPf?usp=sharing
+2025-06-08 17:39:06,425 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 17:39:07,316 INFO src.preprocessing.gdrive_manager: Downloading file 1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR to videos\Use case of Agent SDK.mp4
+2025-06-08 17:39:13,427 INFO src.preprocessing.gdrive_manager: Download 13%
+2025-06-08 17:39:19,466 INFO src.preprocessing.gdrive_manager: Download 27%
+2025-06-08 17:39:25,895 INFO src.preprocessing.gdrive_manager: Download 41%
+2025-06-08 17:39:31,921 INFO src.preprocessing.gdrive_manager: Download 54%
+2025-06-08 17:39:37,980 INFO src.preprocessing.gdrive_manager: Download 68%
+2025-06-08 17:39:43,722 INFO src.preprocessing.gdrive_manager: Download 82%
+2025-06-08 17:39:49,857 INFO src.preprocessing.gdrive_manager: Download 96%
+2025-06-08 17:39:53,573 INFO src.preprocessing.gdrive_manager: Download 100%
+2025-06-08 17:39:53,574 INFO src.preprocessing.gdrive_manager: Download complete: videos\Use case of Agent SDK.mp4
+2025-06-08 17:39:53,575 INFO src.preprocessing.download_manager: Downloaded: Use case of Agent SDK.mp4
+2025-06-08 17:39:53,576 INFO src.main_flow: Processing video: Use case of Agent SDK.mp4
+2025-06-08 17:39:57,339 INFO src.main_flow: Converted video to audio: audios\Use case of Agent SDK.wav
+2025-06-08 17:40:05,307 INFO src.preprocessing.gdrive_manager: Uploaded audios\Use case of Agent SDK.wav to Drive folder 1bLbSXaO3AS-EuBg_o7sGc8AonkHt7SdG
+2025-06-08 17:40:05,813 WARNING googleapiclient.http: Encountered 403 Forbidden with reason "insufficientFilePermissions"
+2025-06-08 17:40:05,814 ERROR src.preprocessing.gdrive_manager: An error occurred: <HttpError 403 when requesting https://www.googleapis.com/drive/v3/files/1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR? returned "The user does not have sufficient permissions for this file.". Details: "[{'message': 'The user does not have sufficient permissions for this file.', 'domain': 'global', 'reason': 'insufficientFilePermissions'}]">
+2025-06-08 17:49:38,100 INFO src.preprocessing.transcript_generator: Transcript saved to transcripts\Use case of Agent SDK.txt
+2025-06-08 17:49:38,109 INFO src.main_flow: Generated transcript: transcripts\Use case of Agent SDK.txt
+2025-06-08 17:49:40,243 INFO src.preprocessing.gdrive_manager: Uploaded transcripts\Use case of Agent SDK.txt to Drive folder 1TbqLgYXOguxYivMiy17s1UVqUKxpGtt3
+2025-06-08 17:49:41,240 INFO src.preprocessing.gdrive_manager: Deleted file 1OVvobHvzntShRprzt0L6OdW5eRFn2-xb from Drive
+2025-06-08 17:49:41,662 INFO src.preprocessing.gdrive_manager: Downloading file 1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR to videos\Use case of Agent SDK.mp4
+2025-06-08 17:49:47,940 INFO src.preprocessing.gdrive_manager: Download 13%
+2025-06-08 17:49:53,844 INFO src.preprocessing.gdrive_manager: Download 27%
+2025-06-08 17:50:01,022 INFO src.preprocessing.gdrive_manager: Download 41%
+2025-06-08 17:50:07,310 INFO src.preprocessing.gdrive_manager: Download 54%
+2025-06-08 17:50:13,325 INFO src.preprocessing.gdrive_manager: Download 68%
+2025-06-08 17:50:19,681 INFO src.preprocessing.gdrive_manager: Download 82%
+2025-06-08 17:50:25,851 INFO src.preprocessing.gdrive_manager: Download 96%
+2025-06-08 17:50:29,724 INFO src.preprocessing.gdrive_manager: Download 100%
+2025-06-08 17:50:29,727 INFO src.preprocessing.gdrive_manager: Download complete: videos\Use case of Agent SDK.mp4
+2025-06-08 17:50:29,730 INFO src.preprocessing.download_manager: Downloaded: Use case of Agent SDK.mp4
+2025-06-08 17:50:29,731 INFO src.main_flow: Processing video: Use case of Agent SDK.mp4
+2025-06-08 17:50:35,469 INFO src.main_flow: Converted video to audio: audios\Use case of Agent SDK.wav
+2025-06-08 17:50:44,607 INFO src.preprocessing.gdrive_manager: Uploaded audios\Use case of Agent SDK.wav to Drive folder 1bLbSXaO3AS-EuBg_o7sGc8AonkHt7SdG
+2025-06-08 17:50:45,158 WARNING googleapiclient.http: Encountered 403 Forbidden with reason "insufficientFilePermissions"
+2025-06-08 17:50:45,159 ERROR src.preprocessing.gdrive_manager: An error occurred: <HttpError 403 when requesting https://www.googleapis.com/drive/v3/files/1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR? returned "The user does not have sufficient permissions for this file.". Details: "[{'message': 'The user does not have sufficient permissions for this file.', 'domain': 'global', 'reason': 'insufficientFilePermissions'}]">
+2025-06-08 18:00:17,517 INFO src.preprocessing.transcript_generator: Transcript saved to transcripts\Use case of Agent SDK.txt
+2025-06-08 18:00:17,522 INFO src.main_flow: Generated transcript: transcripts\Use case of Agent SDK.txt
+2025-06-08 18:00:19,461 INFO src.preprocessing.gdrive_manager: Uploaded transcripts\Use case of Agent SDK.txt to Drive folder 1TbqLgYXOguxYivMiy17s1UVqUKxpGtt3
+2025-06-08 18:00:20,515 INFO src.preprocessing.gdrive_manager: Deleted file 1WIvxSHPx95N2bx4XFF4FIPtUnQhofasU from Drive
+2025-06-08 18:00:20,942 INFO src.preprocessing.gdrive_manager: Downloading file 1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR to videos\Use case of Agent SDK.mp4
+2025-06-08 18:00:28,170 INFO src.preprocessing.gdrive_manager: Download 13%
+2025-06-08 18:00:35,470 INFO src.preprocessing.gdrive_manager: Download 27%
+2025-06-08 18:00:42,724 INFO src.preprocessing.gdrive_manager: Download 41%
+2025-06-08 18:00:49,442 INFO src.preprocessing.gdrive_manager: Download 54%
+2025-06-08 18:00:55,637 INFO src.preprocessing.gdrive_manager: Download 68%
+2025-06-08 18:01:02,125 INFO src.preprocessing.gdrive_manager: Download 82%
+2025-06-08 18:01:08,557 INFO src.preprocessing.gdrive_manager: Download 96%
+2025-06-08 18:01:12,266 INFO src.preprocessing.gdrive_manager: Download 100%
+2025-06-08 18:01:12,267 INFO src.preprocessing.gdrive_manager: Download complete: videos\Use case of Agent SDK.mp4
+2025-06-08 18:01:12,268 INFO src.preprocessing.download_manager: Downloaded: Use case of Agent SDK.mp4
+2025-06-08 18:01:12,269 INFO src.main_flow: Processing video: Use case of Agent SDK.mp4
+2025-06-08 18:01:16,407 INFO src.main_flow: Converted video to audio: audios\Use case of Agent SDK.wav
+2025-06-08 18:01:21,032 INFO src.preprocessing.gdrive_manager: Uploaded audios\Use case of Agent SDK.wav to Drive folder 1bLbSXaO3AS-EuBg_o7sGc8AonkHt7SdG
+2025-06-08 18:01:21,557 WARNING googleapiclient.http: Encountered 403 Forbidden with reason "insufficientFilePermissions"
+2025-06-08 18:01:21,558 ERROR src.preprocessing.gdrive_manager: An error occurred: <HttpError 403 when requesting https://www.googleapis.com/drive/v3/files/1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR? returned "The user does not have sufficient permissions for this file.". Details: "[{'message': 'The user does not have sufficient permissions for this file.', 'domain': 'global', 'reason': 'insufficientFilePermissions'}]">
+2025-06-08 18:08:21,623 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:08:22,230 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:08:26,332 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:09:27,158 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:09:30,596 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:09:36,990 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:09:39,314 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:09:39,341 INFO src.main_flow: Processing Google Drive folder: https://drive.google.com/drive/folders/1angHYyiE_sPTKpRsrHyPAJkYF7b78iPf?usp=sharing
+2025-06-08 18:09:39,564 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:09:40,779 INFO src.preprocessing.gdrive_manager: Downloading file 1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR to videos\Use case of Agent SDK.mp4
+2025-06-08 18:09:48,341 INFO src.preprocessing.gdrive_manager: Download 13%
+2025-06-08 18:09:54,815 INFO src.preprocessing.gdrive_manager: Download 27%
+2025-06-08 18:10:01,854 INFO src.preprocessing.gdrive_manager: Download 41%
+2025-06-08 18:10:08,034 INFO src.preprocessing.gdrive_manager: Download 54%
+2025-06-08 18:10:14,353 INFO src.preprocessing.gdrive_manager: Download 68%
+2025-06-08 18:10:20,880 INFO src.preprocessing.gdrive_manager: Download 82%
+2025-06-08 18:10:26,969 INFO src.preprocessing.gdrive_manager: Download 96%
+2025-06-08 18:10:30,770 INFO src.preprocessing.gdrive_manager: Download 100%
+2025-06-08 18:10:30,771 INFO src.preprocessing.gdrive_manager: Download complete: videos\Use case of Agent SDK.mp4
+2025-06-08 18:10:30,772 INFO src.main_flow: Downloaded: Use case of Agent SDK.mp4
+2025-06-08 18:10:34,935 INFO src.main_flow: Converted video to audio: audios\Use case of Agent SDK.wav
+2025-06-08 18:10:39,644 INFO src.preprocessing.gdrive_manager: Uploaded audios\Use case of Agent SDK.wav to Drive folder 1bLbSXaO3AS-EuBg_o7sGc8AonkHt7SdG
+2025-06-08 18:10:40,151 WARNING googleapiclient.http: Encountered 403 Forbidden with reason "insufficientFilePermissions"
+2025-06-08 18:10:40,151 ERROR src.preprocessing.gdrive_manager: An error occurred: <HttpError 403 when requesting https://www.googleapis.com/drive/v3/files/1lmf1nOopxUxdJUWKd6Xq-OTAQdrWorIR? returned "The user does not have sufficient permissions for this file.". Details: "[{'message': 'The user does not have sufficient permissions for this file.', 'domain': 'global', 'reason': 'insufficientFilePermissions'}]">
+2025-06-08 18:20:12,037 INFO src.preprocessing.transcript_generator: Transcript saved to transcripts\Use case of Agent SDK.txt
+2025-06-08 18:20:12,262 INFO src.main_flow: Generated transcript: transcripts\Use case of Agent SDK.txt
+2025-06-08 18:20:14,382 INFO src.preprocessing.gdrive_manager: Uploaded transcripts\Use case of Agent SDK.txt to Drive folder 1TbqLgYXOguxYivMiy17s1UVqUKxpGtt3
+2025-06-08 18:20:15,400 INFO src.preprocessing.gdrive_manager: Deleted file 1BMBHClP2MjbnQg-3jI0DldLo66plM5eU from Drive
+2025-06-08 18:20:15,409 INFO src.preprocessing.gdrive_manager: Downloading file 1cxXlHB38p3oBm1cEr4LWqyzMDQqRj3VJ to videos\Working of Agent SDK.mp4
+2025-06-08 18:20:22,045 INFO src.preprocessing.gdrive_manager: Download 100%
+2025-06-08 18:20:22,046 INFO src.preprocessing.gdrive_manager: Download complete: videos\Working of Agent SDK.mp4
+2025-06-08 18:20:22,047 INFO src.main_flow: Downloaded: Working of Agent SDK.mp4
+2025-06-08 18:20:22,624 INFO src.main_flow: Converted video to audio: audios\Working of Agent SDK.wav
+2025-06-08 18:20:25,332 INFO src.preprocessing.gdrive_manager: Uploaded audios\Working of Agent SDK.wav to Drive folder 1bLbSXaO3AS-EuBg_o7sGc8AonkHt7SdG
+2025-06-08 18:20:25,863 WARNING googleapiclient.http: Encountered 403 Forbidden with reason "insufficientFilePermissions"
+2025-06-08 18:20:25,865 ERROR src.preprocessing.gdrive_manager: An error occurred: <HttpError 403 when requesting https://www.googleapis.com/drive/v3/files/1cxXlHB38p3oBm1cEr4LWqyzMDQqRj3VJ? returned "The user does not have sufficient permissions for this file.". Details: "[{'message': 'The user does not have sufficient permissions for this file.', 'domain': 'global', 'reason': 'insufficientFilePermissions'}]">
+2025-06-08 18:20:57,038 INFO src.preprocessing.transcript_generator: Transcript saved to transcripts\Working of Agent SDK.txt
+2025-06-08 18:20:57,433 INFO src.main_flow: Generated transcript: transcripts\Working of Agent SDK.txt
+2025-06-08 18:20:59,342 INFO src.preprocessing.gdrive_manager: Uploaded transcripts\Working of Agent SDK.txt to Drive folder 1TbqLgYXOguxYivMiy17s1UVqUKxpGtt3
+2025-06-08 18:21:00,515 INFO src.preprocessing.gdrive_manager: Deleted file 1h87GpnkRFs8flu5PVticplmIFa2IXsTH from Drive
+2025-06-08 18:21:00,517 INFO src.preprocessing.gdrive_manager: Downloading file 1LeCsQBqZLrGFTOLzNCOV57RDO5nZWqfS to videos\Overview and Key Components of Agent SDK.mp4
+2025-06-08 18:21:10,786 INFO src.preprocessing.gdrive_manager: Download 77%
+2025-06-08 18:21:14,307 INFO src.preprocessing.gdrive_manager: Download 100%
+2025-06-08 18:21:14,307 INFO src.preprocessing.gdrive_manager: Download complete: videos\Overview and Key Components of Agent SDK.mp4
+2025-06-08 18:21:14,308 INFO src.main_flow: Downloaded: Overview and Key Components of Agent SDK.mp4
+2025-06-08 18:21:15,609 INFO src.main_flow: Converted video to audio: audios\Overview and Key Components of Agent SDK.wav
+2025-06-08 18:21:18,413 INFO src.preprocessing.gdrive_manager: Uploaded audios\Overview and Key Components of Agent SDK.wav to Drive folder 1bLbSXaO3AS-EuBg_o7sGc8AonkHt7SdG
+2025-06-08 18:21:18,942 WARNING googleapiclient.http: Encountered 403 Forbidden with reason "insufficientFilePermissions"
+2025-06-08 18:21:18,943 ERROR src.preprocessing.gdrive_manager: An error occurred: <HttpError 403 when requesting https://www.googleapis.com/drive/v3/files/1LeCsQBqZLrGFTOLzNCOV57RDO5nZWqfS? returned "The user does not have sufficient permissions for this file.". Details: "[{'message': 'The user does not have sufficient permissions for this file.', 'domain': 'global', 'reason': 'insufficientFilePermissions'}]">
+2025-06-08 18:23:10,783 INFO src.preprocessing.transcript_generator: Transcript saved to transcripts\Overview and Key Components of Agent SDK.txt
+2025-06-08 18:23:10,804 INFO src.main_flow: Generated transcript: transcripts\Overview and Key Components of Agent SDK.txt
+2025-06-08 18:23:13,212 INFO src.preprocessing.gdrive_manager: Uploaded transcripts\Overview and Key Components of Agent SDK.txt to Drive folder 1TbqLgYXOguxYivMiy17s1UVqUKxpGtt3
+2025-06-08 18:23:14,602 INFO src.preprocessing.gdrive_manager: Deleted file 1SZZWmURjm3CCmUp4UKLsh_7KIdN8CYSS from Drive
+2025-06-08 18:23:15,609 INFO src.main_flow: Processing mentor materials...
+2025-06-08 18:23:15,678 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:23:19,895 INFO src.preprocessing.gdrive_manager: Uploaded mentor_materials\Agent SDK_V1_24-04-25.txt to Drive folder 1OVhmzLD5NHmrHknSSWwAYC_NVlD39-sh
+2025-06-08 18:23:19,982 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:23:22,500 INFO src.preprocessing.gdrive_manager: Uploaded mentor_materials\Agent_SDK_+_Google_SDK.txt to Drive folder 1OVhmzLD5NHmrHknSSWwAYC_NVlD39-sh
+2025-06-08 18:23:24,506 INFO src.main_flow: Generating quality reports...
+2025-06-08 18:23:24,532 INFO src.report_generation.report_generator: Generating report for: Overview and Key Components of Agent SDK
+2025-06-08 18:23:29,489 INFO httpx: HTTP Request: POST https://tst123451307193883.openai.azure.com//openai/deployments/gpt-4o-mini/chat/completions?api-version=2025-01-01-preview "HTTP/1.1 200 OK"
+2025-06-08 18:23:29,496 INFO src.report_generation.report_generator: Report saved to reports\report_Overview and Key Components of Agent SDK.txt
+2025-06-08 18:23:31,497 INFO src.report_generation.report_generator: Generating report for: Use case of Agent SDK
+2025-06-08 18:23:36,063 INFO httpx: HTTP Request: POST https://tst123451307193883.openai.azure.com//openai/deployments/gpt-4o-mini/chat/completions?api-version=2025-01-01-preview "HTTP/1.1 200 OK"
+2025-06-08 18:23:36,066 INFO src.report_generation.report_generator: Report saved to reports\report_Use case of Agent SDK.txt
+2025-06-08 18:23:38,070 INFO src.report_generation.report_generator: Generating report for: Working of Agent SDK
+2025-06-08 18:23:44,521 INFO httpx: HTTP Request: POST https://tst123451307193883.openai.azure.com//openai/deployments/gpt-4o-mini/chat/completions?api-version=2025-01-01-preview "HTTP/1.1 200 OK"
+2025-06-08 18:23:44,526 INFO src.report_generation.report_generator: Report saved to reports\report_Working of Agent SDK.txt
+2025-06-08 18:23:46,633 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:23:49,116 INFO src.preprocessing.gdrive_manager: Uploaded reports\report_Overview and Key Components of Agent SDK.txt to Drive folder 1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H
+2025-06-08 18:23:50,927 INFO src.preprocessing.gdrive_manager: Uploaded reports\report_Use case of Agent SDK.txt to Drive folder 1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H
+2025-06-08 18:23:53,100 INFO src.preprocessing.gdrive_manager: Uploaded reports\report_Working of Agent SDK.txt to Drive folder 1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H
+2025-06-08 18:50:48,799 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:50:48,799 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:50:52,608 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:50:57,758 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:51:00,362 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:51:04,124 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:51:05,284 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:51:05,302 INFO src.main_flow: Processing mentor materials...
+2025-06-08 18:51:05,577 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:51:08,061 INFO src.preprocessing.gdrive_manager: Uploaded mentor_materials\Agent SDK_V1_24-04-25.txt to Drive folder 1OVhmzLD5NHmrHknSSWwAYC_NVlD39-sh
+2025-06-08 18:51:08,374 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:51:10,776 INFO src.preprocessing.gdrive_manager: Uploaded mentor_materials\Agent_SDK_+_Google_SDK.txt to Drive folder 1OVhmzLD5NHmrHknSSWwAYC_NVlD39-sh
+2025-06-08 18:51:11,792 INFO src.main_flow: Processing Google Drive folder: https://drive.google.com/drive/folders/1angHYyiE_sPTKpRsrHyPAJkYF7b78iPf?usp=sharing
+2025-06-08 18:51:12,074 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:51:13,344 INFO src.main_flow: Transcript for Use case of Agent SDK already exists in Drive. Skipping video.
+2025-06-08 18:51:13,345 INFO src.main_flow: Transcript for Working of Agent SDK already exists in Drive. Skipping video.
+2025-06-08 18:51:13,346 INFO src.main_flow: Transcript for Overview and Key Components of Agent SDK already exists in Drive. Skipping video.
+2025-06-08 18:51:15,413 INFO src.main_flow: Generating quality reports...
+2025-06-08 18:51:15,480 INFO src.report_generation.report_generator: Generating report for: Overview and Key Components of Agent SDK
+2025-06-08 18:51:20,062 INFO httpx: HTTP Request: POST https://tst123451307193883.openai.azure.com//openai/deployments/gpt-4o-mini/chat/completions?api-version=2025-01-01-preview "HTTP/1.1 200 OK"
+2025-06-08 18:51:20,069 INFO src.report_generation.report_generator: Report saved to reports\report_Overview and Key Components of Agent SDK.txt
+2025-06-08 18:51:22,075 INFO src.report_generation.report_generator: Generating report for: Use case of Agent SDK
+2025-06-08 18:51:26,277 INFO httpx: HTTP Request: POST https://tst123451307193883.openai.azure.com//openai/deployments/gpt-4o-mini/chat/completions?api-version=2025-01-01-preview "HTTP/1.1 200 OK"
+2025-06-08 18:51:26,281 INFO src.report_generation.report_generator: Report saved to reports\report_Use case of Agent SDK.txt
+2025-06-08 18:51:28,284 INFO src.report_generation.report_generator: Generating report for: Working of Agent SDK
+2025-06-08 18:51:33,604 INFO httpx: HTTP Request: POST https://tst123451307193883.openai.azure.com//openai/deployments/gpt-4o-mini/chat/completions?api-version=2025-01-01-preview "HTTP/1.1 200 OK"
+2025-06-08 18:51:33,607 INFO src.report_generation.report_generator: Report saved to reports\report_Working of Agent SDK.txt
+2025-06-08 18:51:35,670 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:51:37,987 INFO src.preprocessing.gdrive_manager: Uploaded reports\report_Overview and Key Components of Agent SDK.txt to Drive folder 1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H
+2025-06-08 18:51:40,428 INFO src.preprocessing.gdrive_manager: Uploaded reports\report_Use case of Agent SDK.txt to Drive folder 1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H
+2025-06-08 18:51:42,394 INFO src.preprocessing.gdrive_manager: Uploaded reports\report_Working of Agent SDK.txt to Drive folder 1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H
+2025-06-08 18:53:06,984 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:53:06,985 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:53:06,984 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:53:09,515 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:53:13,865 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:53:16,430 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:53:20,224 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:53:21,497 INFO src.main_flow: Initializing MainFlow with config: config/config.json
+2025-06-08 18:53:21,581 INFO src.main_flow: Processing mentor materials...
+2025-06-08 18:53:22,202 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:53:24,622 INFO src.preprocessing.gdrive_manager: Uploaded mentor_materials\Agent SDK_V1_24-04-25.txt to Drive folder 1OVhmzLD5NHmrHknSSWwAYC_NVlD39-sh
+2025-06-08 18:53:25,001 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:53:27,236 INFO src.preprocessing.gdrive_manager: Uploaded mentor_materials\Agent_SDK_+_Google_SDK.txt to Drive folder 1OVhmzLD5NHmrHknSSWwAYC_NVlD39-sh
+2025-06-08 18:53:28,270 INFO src.main_flow: Processing Google Drive folder: https://drive.google.com/drive/folders/1angHYyiE_sPTKpRsrHyPAJkYF7b78iPf?usp=sharing
+2025-06-08 18:53:28,378 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:53:29,666 INFO src.main_flow: Transcript for Use case of Agent SDK already exists in Drive. Skipping video.
+2025-06-08 18:53:29,668 INFO src.main_flow: Transcript for Working of Agent SDK already exists in Drive. Skipping video.
+2025-06-08 18:53:29,668 INFO src.main_flow: Transcript for Overview and Key Components of Agent SDK already exists in Drive. Skipping video.
+2025-06-08 18:53:31,675 INFO src.main_flow: Generating quality reports...
+2025-06-08 18:53:31,709 INFO src.report_generation.report_generator: Generating report for: Overview and Key Components of Agent SDK
+2025-06-08 18:53:37,017 INFO httpx: HTTP Request: POST https://tst123451307193883.openai.azure.com//openai/deployments/gpt-4o-mini/chat/completions?api-version=2025-01-01-preview "HTTP/1.1 200 OK"
+2025-06-08 18:53:37,022 INFO src.report_generation.report_generator: Report saved to reports\report_Overview and Key Components of Agent SDK.txt
+2025-06-08 18:53:39,025 INFO src.report_generation.report_generator: Generating report for: Use case of Agent SDK
+2025-06-08 18:53:42,574 INFO httpx: HTTP Request: POST https://tst123451307193883.openai.azure.com//openai/deployments/gpt-4o-mini/chat/completions?api-version=2025-01-01-preview "HTTP/1.1 200 OK"
+2025-06-08 18:53:42,576 INFO src.report_generation.report_generator: Report saved to reports\report_Use case of Agent SDK.txt
+2025-06-08 18:53:44,580 INFO src.report_generation.report_generator: Generating report for: Working of Agent SDK
+2025-06-08 18:53:49,005 INFO httpx: HTTP Request: POST https://tst123451307193883.openai.azure.com//openai/deployments/gpt-4o-mini/chat/completions?api-version=2025-01-01-preview "HTTP/1.1 200 OK"
+2025-06-08 18:53:49,008 INFO src.report_generation.report_generator: Report saved to reports\report_Working of Agent SDK.txt
+2025-06-08 18:53:51,061 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0
+2025-06-08 18:53:53,301 INFO src.preprocessing.gdrive_manager: Uploaded reports\report_Overview and Key Components of Agent SDK.txt to Drive folder 1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H
+2025-06-08 18:53:55,368 INFO src.preprocessing.gdrive_manager: Uploaded reports\report_Use case of Agent SDK.txt to Drive folder 1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H
+2025-06-08 18:53:57,568 INFO src.preprocessing.gdrive_manager: Uploaded reports\report_Working of Agent SDK.txt to Drive folder 1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H
+2025-06-08 18:53:58,629 INFO googleapiclient.discovery_cache: file_cache is only supported with oauth2client<4.0.0

reports/report_Overview and Key Components of Agent SDK.txt ADDED Viewed

	@@ -0,0 +1,53 @@

+1a: [✅] The transcript covers the topic of the agent SDK and its key components, including goals, tools, memory, and the reasoning loop.
+1b: [✅] Concepts are introduced in a structured manner, starting from the introduction of the agent SDK to its components and examples.
+1c: [✅] All statements appear to be technically correct and relevant to the topic discussed.
+1d: [✅] Relevant examples are provided, such as the interaction between the user and the AI agent regarding AI trends.
+2a: [N/A] There are no code demonstrations in the transcript.
+2b: [N/A] There are no code components to explain in the transcript.
+2c: [N/A] No libraries or tools are explicitly mentioned in a coding context.
+2d: [N/A] There are no code outputs to validate in the transcript.
+2e: [N/A] There are no hands-on activities mentioned.
+3a: [✅] The speech is coherent and the pacing is appropriate for understanding.
+3b: [✅] There are minimal filler words present in the transcript.
+3c: [✅] Technical terms are pronounced clearly in the context of the transcript.
+3d: [✅] The language used is formal and academic.
+3e: [✅] There are no inappropriate or biased statements present.
+4a: [✅] The spoken content follows the logical order of the topics discussed.
+5a: [❌] There are no explicit calls to action or prompts for reflection included in the transcript.
+5b: [❌] The transcript does not include rhetorical questions to engage learners.
+5c: [❌] There is no encouragement for feedback or queries from learners.
+6a: [✅] The introduction sets the context clearly for the discussion on agent SDK.
+6b: [✅] Transitions between sections are clear and logical.
+7a: [✅] The tone is encouraging and positive throughout the transcript.
+7b: [✅] The language used is inclusive and gender-neutral.
+8a: [✅] The pacing of the discussion appears to match the time markers provided.
+What Went Wrong:
+- Lack of engagement prompts for learners.
+- No rhetorical questions or invitations for feedback.
+How to Improve:
+- Include calls to action or prompts for learners to reflect on the content.
+- Add rhetorical questions to engage the audience and encourage interaction.

reports/report_Use case of Agent SDK.txt ADDED Viewed

	@@ -0,0 +1,51 @@

+1a: [✅] The transcript covers the main topic of building an AI agent using Google SDK and Agent SDK, including subtopics such as API key generation and memory storage.
+1b: [✅] Concepts are introduced in a logical order, starting from the problem statement to the coding process and enhancements.
+1c: [✅] All statements appear to be technically correct, with no evident conceptual inaccuracies.
+1d: [✅] Relevant examples are provided, such as the specific search query used to demonstrate the AI agent's functionality.
+2a: [✅] Code demonstrations are explained clearly, detailing the steps taken in the coding process.
+2b: [✅] The explanation of code components, such as API keys and search engine IDs, is thorough.
+2c: [✅] All libraries and tools used, such as Google API Python client and OpenAI API, are explicitly named and explained.
+2d: [✅] Expected outputs are described, including the results returned by the AI agent.
+2e: [✅] The pacing of the hands-on activities is appropriate for learners to follow along.
+3a: [✅] The speech is coherent and paced well, making it easy to understand.
+3b: [✅] There is minimal use of filler words throughout the transcript.
+3c: [✅] Technical terms are pronounced clearly, aiding comprehension.
+3d: [✅] The language used is formal and respectful, suitable for an academic setting.
+3e: [✅] There are no inappropriate or biased statements present.
+4a: [✅] The spoken content follows the logical sequence of the topics discussed.
+5a: [✅] There are prompts for learners to try things themselves, such as downloading the code.
+5b: [✅] Rhetorical questions are included to engage learners, enhancing interactivity.
+5c: [✅] The speaker encourages feedback and questions, promoting learner engagement.
+6a: [✅] The session begins with a clear introduction that sets the context for the topic.
+6b: [✅] Clear transitions between sections are indicated, helping maintain flow.
+7a: [✅] The tone is encouraging and positive, motivating learners throughout the session.
+7b: [✅] The language is inclusive and gender-neutral, accommodating diverse backgrounds.
+8a: [✅] The pacing of the session aligns with the time markers mentioned.
+What Went Wrong:
+- None identified.
+How to Improve:
+- None identified.

reports/report_Working of Agent SDK.txt ADDED Viewed

	@@ -0,0 +1,39 @@

+1a: [✅] The topic of how the agent SDK works is mentioned and explained, focusing on its functionality and process.
+1b: [✅] The explanation follows a logical order, starting from setting a goal to the output display.
+1c: [✅] All statements regarding the agent SDK's operation are technically correct.
+1d: [✅] An example of adding two numbers in Python is provided, which helps clarify the concept.
+2a: [❌] There is no code demonstration provided in the transcript.
+2b: [N/A] Not applicable as there is no code walkthrough.
+2c: [N/A] Not applicable as there is no code demonstration.
+2d: [N/A] Not applicable as there is no code demonstration.
+2e: [N/A] Not applicable as there is no code demonstration.
+3a: [✅] The speech is coherent and understandable.
+3b: [✅] There are minimal filler words present.
+3c: [✅] Technical terms are pronounced clearly.
+3d: [✅] The language used is formal and respectful.
+3e: [✅] There are no inappropriate or biased statements.
+4a: [✅] The spoken content aligns with the logical flow of the topic discussed.
+5a: [❌] There are no prompts for learner engagement or calls to action.
+5b: [❌] No rhetorical questions are included to engage learners.
+5c: [❌] There is no invitation for feedback or queries from learners.
+6a: [✅] The introduction sets the context for the discussion about the agent SDK.
+6b: [✅] Transitions between concepts are clear and logical.
+7a: [✅] The tone is encouraging and positive throughout the explanation.
+7b: [✅] The language used is inclusive and gender-neutral.
+8a: [✅] The pacing of the discussion appears to match the time markers provided.
+8b: [N/A] Not applicable as there are no specific time management indicators mentioned.
+What Went Wrong:
+- Lack of code demonstration and explanation of code components.
+- No engagement prompts or questions to involve learners.
+How to Improve:
+- Include a code demonstration with clear explanations of components and expected outputs.
+- Add engagement prompts, such as questions or calls to action, to encourage learner interaction.

requirements.txt ADDED Viewed

	@@ -0,0 +1,11 @@

+streamlit
+python-dotenv
+azure-cognitiveservices-speech
+openai
+nbformat
+python-pptx
+ffmpeg-python
+google-auth
+google-api-python-client
+google-auth-httplib2
+google-auth-oauthlib

src/__init__.py ADDED Viewed

File without changes

src/__pycache__/__init__.cpython-312.pyc ADDED Viewed

Binary file (139 Bytes). View file

src/__pycache__/main_flow.cpython-312.pyc ADDED Viewed

Binary file (11.8 kB). View file

src/main_flow.py ADDED Viewed

	@@ -0,0 +1,195 @@

+# src/main_flow.py
+from src.preprocessing.gdrive_manager import GoogleDriveManager
+from src.preprocessing.download_manager import GoogleDriveDownloader
+from src.preprocessing.video_processor import VideoProcessor
+from src.preprocessing.transcript_generator import TranscriptGenerator
+from src.preprocessing.file_processor import FileProcessor
+from src.report_generation.openai_client import OpenAIClient
+from src.report_generation.report_generator import ReportGenerator
+import json
+import os
+import glob
+import asyncio
+import logging
+import tempfile
+import shutil
+import googleapiclient.errors
+logger = logging.getLogger(__name__)
+class MainFlow:
+    def __init__(self, config_path: str):
+        logger.info("Initializing MainFlow with config: %s", config_path)
+        with open(config_path) as f:
+            self.config = json.load(f)
+        self.paths = self.config["PATHS"]
+        self.drive_folders = {
+            "VIDEOS": "1angHYyiE_sPTKpRsrHyPAJkYF7b78iPf",
+            "AUDIOS": "1bLbSXaO3AS-EuBg_o7sGc8AonkHt7SdG",
+            "TRANSCRIPTS": "1TbqLgYXOguxYivMiy17s1UVqUKxpGtt3",
+            "REPORTS": "1JgwDdQVc1YsyKNhag5l1PdD607vMjy1H",
+            "MENTOR_MATERIALS": "1OVhmzLD5NHmrHknSSWwAYC_NVlD39-sh"
+        }
+        self._create_directories()
+    def _create_directories(self):
+        for path in self.paths.values():
+            os.makedirs(path, exist_ok=True)
+    async def process_drive_url(self, folder_url: str):
+        logger.info("Processing Google Drive folder: %s", folder_url)
+        VideoProcessor.clean_directory(self.paths["VIDEOS"])
+        VideoProcessor.clean_directory(self.paths["AUDIOS"])
+        download_manager = GoogleDriveDownloader(self.paths["VIDEOS"], self.drive_folders)
+        gdrive = download_manager.gdrive
+        # Get all video files in Drive
+        video_files = download_manager.list_all_videos(folder_url)
+        if not video_files:
+            logger.warning("No videos to process in folder: %s", folder_url)
+            return
+        # Get all transcript files in Drive Transcripts folder
+        transcript_drive_files = gdrive.list_txt_files(self.drive_folders["TRANSCRIPTS"])
+        transcript_names = {os.path.splitext(f['name'])[0] for f in transcript_drive_files}
+        for video in video_files:
+            base_name = os.path.splitext(video['name'])[0]
+            if base_name in transcript_names:
+                logger.info(f"Transcript for {base_name} already exists in Drive. Skipping video.")
+                continue
+            # Download and process this video
+            local_video_path = os.path.join(self.paths["VIDEOS"], video['name'])
+            gdrive.download_file(video['id'], local_video_path)
+            logger.info(f"Downloaded: {video['name']}")
+            video_id = video['id']
+            video_name = video['name']
+            video_path = local_video_path
+            audio_path = os.path.join(self.paths["AUDIOS"], f"{base_name}.wav")
+            transcript_path = os.path.join(self.paths["TRANSCRIPTS"], f"{base_name}.txt")
+            video_processor = VideoProcessor()
+            transcript_generator = TranscriptGenerator(
+                os.getenv("AZURE_SPEECH_KEY"),
+                os.getenv("AZURE_SPEECH_REGION")
+            )
+            try:
+                # Convert video to audio
+                if video_processor.convert_mp4_to_wav(video_path, audio_path):
+                    logger.info("Converted video to audio: %s", audio_path)
+                    # Upload audio to Drive
+                    download_manager.upload_to_drive(audio_path, "AUDIOS", "audio/wav")
+                    # Delete video from Drive and local
+                    try:
+                        download_manager.delete_drive_file(video_id)
+                    except googleapiclient.errors.HttpError as e:
+                        if e.resp.status == 403:
+                            logger.warning(f"Skipping delete for {video_name} due to insufficient permissions.")
+                        else:
+                            logger.error(f"Error deleting video from Drive: {e}")
+                    try:
+                        os.remove(video_path)
+                    except Exception as e:
+                        logger.warning(f"Could not delete local video file: {e}")
+                    # Generate transcript
+                    if transcript_generator.transcribe_audio(audio_path, transcript_path):
+                        logger.info(f"Generated transcript: {transcript_path}")
+                        # Upload transcript to Drive
+                        download_manager.upload_to_drive(transcript_path, "TRANSCRIPTS", "text/plain")
+                        # Delete audio from Drive and local
+                        audio_drive_id = gdrive.find_file_by_name(self.drive_folders["AUDIOS"], f"{base_name}.wav")
+                        if audio_drive_id:
+                            try:
+                                download_manager.delete_drive_file(audio_drive_id)
+                            except googleapiclient.errors.HttpError as e:
+                                if e.resp.status == 403:
+                                    logger.warning(f"Skipping delete for audio {base_name}.wav due to insufficient permissions.")
+                                else:
+                                    logger.error(f"Error deleting audio from Drive: {e}")
+                        try:
+                            os.remove(audio_path)
+                        except Exception as e:
+                            logger.warning(f"Could not delete local audio file: {e}")
+                    else:
+                        logger.error(f"Failed to generate transcript for {video_name}")
+                else:
+                    logger.error(f"Failed to convert video: {video_name}")
+            except googleapiclient.errors.HttpError as e:
+                if e.resp.status == 403:
+                    logger.warning(f"Skipping file {video_name} due to insufficient permissions.")
+                else:
+                    logger.error(f"Google API error: {e}")
+            except Exception as e:
+                logger.error(f"Unexpected error processing {video_name}: {e}")
+    def process_mentor_materials(self, files: dict):
+        """Process mentor materials (PPTX/IPYNB)"""
+        logger.info("Processing mentor materials...")
+        processed_files = []
+        # Clean directory first
+        VideoProcessor.clean_directory(self.paths["MENTOR_MATERIALS"])
+        for file_type, file_data in files.items():
+            if not file_data:
+                continue
+            # Save uploaded file
+            file_path = os.path.join(self.paths["MENTOR_MATERIALS"], file_data.name)
+            with open(file_path, "wb") as f:
+                f.write(file_data.getbuffer())
+            # Process based on file type
+            base_name = os.path.splitext(file_data.name)[0]
+            output_path = os.path.join(self.paths["MENTOR_MATERIALS"], f"{base_name}.txt")
+            if file_type == "slides" and file_path.lower().endswith(('.pptx', '.ppt')):
+                content = FileProcessor.process_slide_file(file_path)
+            elif file_type == "notebook" and file_path.lower().endswith('.ipynb'):
+                content = FileProcessor.process_notebook_file(file_path)
+            else:
+                logger.error(f"Unsupported file type: {file_data.name}")
+                continue
+            # Save processed content
+            with open(output_path, 'w', encoding='utf-8') as f:
+                f.write(content)
+            # Remove original file
+            os.remove(file_path)
+            # Upload to Drive
+            gdrive = GoogleDriveManager()
+            gdrive.upload_file(output_path, self.drive_folders["MENTOR_MATERIALS"], "application/octet-stream")
+            processed_files.append(output_path)
+        return processed_files
+    def generate_quality_reports(self):
+        """Generate quality reports"""
+        logger.info("Generating quality reports...")
+        # Load checklist
+        with open("config/checklist.txt", "r") as f:
+            checklist = f.read()
+        # Initialize OpenAI client
+        openai_client = OpenAIClient("config/config.json")
+        client = openai_client.get_client()
+        deployment = openai_client.get_deployment()
+        report_generator = ReportGenerator(client, deployment, checklist)
+        report_generator.generate_reports(
+            self.paths["TRANSCRIPTS"],
+            self.paths["MENTOR_MATERIALS"],
+            self.paths["REPORTS"]
+        )
+        # Upload reports to Drive
+        gdrive = GoogleDriveManager()
+        for report_file in os.listdir(self.paths["REPORTS"]):
+            if report_file.endswith(".txt"):
+                local_path = os.path.join(self.paths["REPORTS"], report_file)
+                gdrive.upload_file(local_path, self.drive_folders["REPORTS"], "text/plain")

src/preprocessing/__pycache__/download_manager.cpython-312.pyc ADDED Viewed

Binary file (2.85 kB). View file

src/preprocessing/__pycache__/file_processor.cpython-312.pyc ADDED Viewed

Binary file (3.51 kB). View file

src/preprocessing/__pycache__/gdrive_manager.cpython-312.pyc ADDED Viewed

Binary file (5.91 kB). View file

src/preprocessing/__pycache__/transcript_generator.cpython-312.pyc ADDED Viewed

Binary file (4.69 kB). View file

src/preprocessing/__pycache__/video_processor.cpython-312.pyc ADDED Viewed

Binary file (2.46 kB). View file

src/preprocessing/download_manager.py ADDED Viewed

	@@ -0,0 +1,42 @@

+# src/preprocessing/download_manager.py
+import os
+import logging
+from .gdrive_manager import GoogleDriveManager
+logger = logging.getLogger(__name__)
+class GoogleDriveDownloader:
+    def __init__(self, download_path: str, drive_folders: dict):
+        self.download_path = download_path
+        os.makedirs(download_path, exist_ok=True)
+        self.gdrive = GoogleDriveManager()
+        self.drive_folders = drive_folders  # Dict with keys: VIDEOS, AUDIOS, TRANSCRIPTS, REPORTS, MENTOR_MATERIALS
+    def process_one_video(self, videos_folder_url: str):
+        videos_folder_id = self.gdrive.get_folder_id(videos_folder_url)
+        video_files = self.gdrive.list_files(videos_folder_id, 'video/mp4')
+        if not video_files:
+            logger.info("No videos found in Drive folder.")
+            return None
+        # Process only the first video
+        video = video_files[0]
+        local_video_path = os.path.join(self.download_path, video['name'])
+        self.gdrive.download_file(video['id'], local_video_path)
+        logger.info(f"Downloaded: {video['name']}")
+        return {
+            'id': video['id'],
+            'name': video['name'],
+            'path': local_video_path
+        }
+    def delete_drive_file(self, file_id):
+        self.gdrive.delete_file(file_id)
+    def upload_to_drive(self, local_path, folder_key, mime_type):
+        folder_id = self.drive_folders[folder_key]
+        return self.gdrive.upload_file(local_path, folder_id, mime_type)
+    def list_all_videos(self, videos_folder_url: str):
+        videos_folder_id = self.gdrive.get_folder_id(videos_folder_url)
+        return self.gdrive.list_files(videos_folder_id, 'video/mp4')

src/preprocessing/file_processor.py ADDED Viewed

	@@ -0,0 +1,52 @@

+# src/preprocessing/file_processor.py
+from pptx import Presentation
+import nbformat
+import re
+import os
+import logging
+logger = logging.getLogger(__name__)
+class FileProcessor:
+    @staticmethod
+    def process_slide_file(file_path: str) -> str:
+        try:
+            prs = Presentation(file_path)
+            content = []
+            for i, slide in enumerate(prs.slides):
+                content.append(f"=== Slide {i+1} ===")
+                for shape in slide.shapes:
+                    if hasattr(shape, "text") and shape.text.strip():
+                        cleaned_text = re.sub(r'\s+', ' ', shape.text.strip())
+                        content.append(cleaned_text)
+                content.append("")
+            return "\n".join(content)
+        except Exception as e:
+            logger.error(f"Error processing presentation: {str(e)}")
+            return ""
+    @staticmethod
+    def process_notebook_file(file_path: str) -> str:
+        try:
+            with open(file_path, 'r', encoding='utf-8') as f:
+                nb = nbformat.read(f, as_version=4)
+            content = []
+            for cell in nb.cells:
+                if cell.cell_type == 'code':
+                    content.append("## CODE CELL ##")
+                    content.append(cell.source.strip())
+                    content.append("----")
+                elif cell.cell_type == 'markdown':
+                    content.append("## MARKDOWN CELL ##")
+                    cleaned_text = cell.source.strip()
+                    cleaned_text = re.sub(r'#+\s*', '', cleaned_text)
+                    cleaned_text = re.sub(r'\*{1,2}(.*?)\*{1,2}', r'\1', cleaned_text)
+                    cleaned_text = re.sub(r'\[(.*?)\]\(.*?\)', r'\1', cleaned_text)
+                    content.append(cleaned_text)
+                    content.append("----")
+            return "\n".join(content)
+        except Exception as e:
+            logger.error(f"Error processing notebook: {str(e)}")
+            return ""

src/preprocessing/gdrive_manager.py ADDED Viewed

	@@ -0,0 +1,93 @@

+# src/preprocessing/gdrive_manager.py
+import os
+import io
+import logging
+from googleapiclient.discovery import build
+from googleapiclient.http import MediaIoBaseDownload, MediaFileUpload
+from googleapiclient.errors import HttpError
+from google.oauth2 import service_account
+logger = logging.getLogger(__name__)
+class GoogleDriveManager:
+    SCOPES = ['https://www.googleapis.com/auth/drive']
+    def __init__(self, credentials_file='credentials.json'):
+        creds = service_account.Credentials.from_service_account_file(
+            credentials_file, scopes=self.SCOPES
+        )
+        self.service = build('drive', 'v3', credentials=creds)
+    def get_folder_id(self, url):
+        """Extract folder ID from Google Drive URL"""
+        if 'folders/' in url:
+            return url.split('folders/')[-1].split('?')[0]
+        elif 'id=' in url:
+            return url.split('id=')[-1].split('&')[0]
+        return url
+    def list_files(self, folder_id, file_type='video/mp4'):
+        """List files in a Google Drive folder"""
+        query = f"'{folder_id}' in parents and mimeType='{file_type}' and trashed=false"
+        results = self.service.files().list(
+            q=query,
+            fields="files(id, name, mimeType)"
+        ).execute()
+        return results.get('files', [])
+    def download_file(self, file_id, destination):
+        """Download a file from Google Drive"""
+        logger.info("Downloading file %s to %s", file_id, destination)
+        request = self.service.files().get_media(fileId=file_id)
+        fh = io.FileIO(destination, 'wb')
+        downloader = MediaIoBaseDownload(fh, request)
+        done = False
+        while not done:
+            status, done = downloader.next_chunk()
+            logger.info(f"Download {int(status.progress() * 100)}%")
+        logger.info("Download complete: %s", destination)
+        return destination
+    def upload_file(self, local_path, drive_folder_id, mime_type):
+        """Upload a file to Google Drive"""
+        file_metadata = {
+            'name': os.path.basename(local_path),
+            'parents': [drive_folder_id]
+        }
+        media = MediaFileUpload(local_path, mimetype=mime_type)
+        file = self.service.files().create(
+            body=file_metadata,
+            media_body=media,
+            fields='id'
+        ).execute()
+        logger.info(f"Uploaded {local_path} to Drive folder {drive_folder_id}")
+        return file.get('id')
+    def delete_file(self, file_id):
+        """Delete a file from Google Drive"""
+        try:
+            self.service.files().delete(fileId=file_id).execute()
+            logger.info(f"Deleted file {file_id} from Drive")
+            return True
+        except HttpError as error:
+            logger.error(f"An error occurred: {error}")
+            return False
+    def find_file_by_name(self, folder_id, filename):
+        """Find a file by name in a folder"""
+        query = f"'{folder_id}' in parents and name='{filename}' and trashed=false"
+        results = self.service.files().list(
+            q=query,
+            fields="files(id)"
+        ).execute()
+        files = results.get('files', [])
+        return files[0]['id'] if files else None
+    def list_txt_files(self, folder_id):
+        """List all .txt files in a Google Drive folder"""
+        query = f"'{folder_id}' in parents and mimeType='text/plain' and trashed=false"
+        results = self.service.files().list(
+            q=query,
+            fields="files(id, name)"
+        ).execute()
+        return results.get('files', [])

src/preprocessing/transcript_generator.py ADDED Viewed

	@@ -0,0 +1,87 @@

+# src/preprocessing/transcript_generator.py
+import azure.cognitiveservices.speech as speechsdk
+import json
+import re
+import time
+import logging
+logger = logging.getLogger(__name__)
+class TranscriptGenerator:
+    def __init__(self, speech_key: str, speech_region: str):
+        self.speech_config = speechsdk.SpeechConfig(
+            subscription=speech_key,
+            region=speech_region
+        )
+        self.speech_config.request_word_level_timestamps = True
+        self.speech_config.output_format = speechsdk.OutputFormat.Detailed
+    def transcribe_audio(self, audio_file_path: str, output_text_file: str):
+        audio_config = speechsdk.audio.AudioConfig(filename=audio_file_path)
+        speech_recognizer = speechsdk.SpeechRecognizer(
+            speech_config=self.speech_config,
+            audio_config=audio_config
+        )
+        all_results = []
+        done = False
+        def handle_final_result(evt):
+            if evt.result.reason == speechsdk.ResultReason.RecognizedSpeech:
+                result_json = json.loads(evt.result.json)
+                if 'NBest' in result_json and result_json['NBest']:
+                    words = result_json['NBest'][0].get('Words', [])
+                    all_results.extend(words)
+        def stop_cb(evt):
+            nonlocal done
+            done = True
+        speech_recognizer.recognized.connect(handle_final_result)
+        speech_recognizer.session_stopped.connect(stop_cb)
+        speech_recognizer.canceled.connect(stop_cb)
+        speech_recognizer.start_continuous_recognition()
+        start_time = time.time()
+        while not done and time.time() - start_time < 1800:  # 30 min timeout
+            time.sleep(0.5)
+        speech_recognizer.stop_continuous_recognition()
+        # Process and save results
+        with open(output_text_file, "w", encoding="utf-8") as f:
+            f.write("start_time\tend_time\tspeaker\ttranscript\n")
+            current_sentence = []
+            current_start = None
+            current_end = None
+            for word in all_results:
+                word_start = word['Offset'] / 10000000
+                word_end = word_start + (word['Duration'] / 10000000)
+                word_text = word['Word']
+                if not current_sentence:
+                    current_start = word_start
+                    current_end = word_end
+                    current_sentence.append(word_text)
+                    continue
+                # Sentence boundary detection
+                time_gap = word_start - current_end
+                is_punctuation = re.match(r'^[.!?]+$', word_text)
+                if time_gap > 1.5 or is_punctuation:
+                    sentence_text = " ".join(current_sentence)
+                    f.write(f"{current_start:.2f}\t{current_end:.2f}\tSPEAKER\t{sentence_text}\n")
+                    current_sentence = [word_text]
+                    current_start = word_start
+                    current_end = word_end
+                else:
+                    current_sentence.append(word_text)
+                    current_end = word_end
+            if current_sentence:
+                sentence_text = " ".join(current_sentence)
+                f.write(f"{current_start:.2f}\t{current_end:.2f}\tSPEAKER\t{sentence_text}\n")
+        logger.info(f"Transcript saved to {output_text_file}")
+        return len(all_results) > 0

src/preprocessing/video_processor.py ADDED Viewed

	@@ -0,0 +1,51 @@

+# src/preprocessing/video_processor.py
+import os
+import subprocess
+import logging
+logger = logging.getLogger(__name__)
+class VideoProcessor:
+    @staticmethod
+    def clean_directory(directory: str):
+        for filename in os.listdir(directory):
+            file_path = os.path.join(directory, filename)
+            try:
+                if os.path.isfile(file_path):
+                    os.unlink(file_path)
+            except Exception as e:
+                logger.error(f"Error deleting {file_path}: {e}")
+    @staticmethod
+    def convert_mp4_to_wav(mp4_file_path: str, wav_file_path: str) -> bool:
+        try:
+            if not os.path.exists(mp4_file_path):
+                logger.error(f"Video file does not exist: {mp4_file_path}")
+                return False
+            command = [
+                "ffmpeg",
+                "-i", mp4_file_path,
+                "-vn",
+                "-acodec", "pcm_s16le",
+                "-ar", "16000",
+                "-ac", "1",
+                "-y",
+                wav_file_path
+            ]
+            result = subprocess.run(
+                command,
+                stdout=subprocess.PIPE,
+                stderr=subprocess.PIPE,
+                text=True
+            )
+            if result.returncode != 0:
+                logger.error(f"FFmpeg error: {result.stderr}")
+                return False
+            return True
+        except Exception as e:
+            logger.error(f"Conversion error: {str(e)}")
+            return False

src/report_generation/__pycache__/openai_client.cpython-312.pyc ADDED Viewed

Binary file (1.56 kB). View file

src/report_generation/__pycache__/report_generator.cpython-312.pyc ADDED Viewed

Binary file (5.44 kB). View file

src/report_generation/openai_client.py ADDED Viewed

	@@ -0,0 +1,25 @@

+# src/report_generation/openai_client.py
+from openai import AzureOpenAI
+import json
+import os
+import logging
+logger = logging.getLogger(__name__)
+class OpenAIClient:
+    def __init__(self, config_path: str):
+        with open(config_path) as f:
+            config = json.load(f)
+        self.client = AzureOpenAI(
+            azure_endpoint=config["AZURE_OPENAI_ENDPOINT"],
+            api_key=os.getenv("AZURE_OPENAI_KEY"),
+            api_version=config["AZURE_OPENAI_APIVERSION"]
+        )
+        self.deployment_name = config["CHATGPT_MODEL"]
+    def get_client(self) -> AzureOpenAI:
+        return self.client
+    def get_deployment(self) -> str:
+        return self.deployment_name

src/report_generation/report_generator.py ADDED Viewed

	@@ -0,0 +1,120 @@

+# src/report_generation/report_generator.py
+import os
+import glob
+import time
+import logging
+from typing import Dict
+logger = logging.getLogger(__name__)
+class ReportGenerator:
+    def __init__(self, openai_client, deployment_name: str, checklist: str):
+        self.client = openai_client
+        self.deployment_name = deployment_name
+        self.checklist = checklist
+    def quality_check(self, transcript_content: str, material_type: str, material_content: str = None) -> str:
+        material_context = ""
+        if material_content:
+            if material_type == "slides":
+                material_context = f"\n### SLIDE CONTENT ###\n{material_content}"
+            elif material_type == "notebook":
+                material_context = f"\n### NOTEBOOK CONTENT ###\n{material_content}"
+        user_input = f"""
+### VIDEO TRANSCRIPT ###
+{transcript_content}
+{material_context}
+### TASK ###
+Review using this checklist:
+{self.checklist}
+### INSTRUCTIONS ###
+1. For EACH checklist item:
+   - Respond using format: [✅/❌/N/A] [Brief explanation]
+2. After checklist, provide:
+   - "What Went Wrong:" (bullet points)
+   - "How to Improve:" (bullet points)
+3. Use ONLY this format:
+### RESPONSE FORMAT ###
+1a: [✅/❌/N/A] [Explanation]
+...
+8b: [✅/❌/N/A] [Explanation]
+What Went Wrong:
+- [Issue 1]
+- [Issue 2]
+How to Improve:
+- [Recommendation 1]
+- [Recommendation 2]
+"""
+        try:
+            response = self.client.chat.completions.create(
+                model=self.deployment_name,
+                messages=[
+                    {"role": "system", "content": "You are an analytical quality assurance assistant."},
+                    {"role": "user", "content": user_input}
+                ],
+                temperature=0.2,
+                max_tokens=4096,
+                top_p=0.95
+            )
+            return response.choices[0].message.content.strip()
+        except Exception as e:
+            logger.error(f"Azure OpenAI error: {str(e)}")
+            return f"Error in quality check: {str(e)}"
+    def generate_reports(self, transcript_path: str, mentor_materials_path: str, reports_dir: str):
+        # Create reports directory if not exists
+        os.makedirs(reports_dir, exist_ok=True)
+        # Get all transcript files
+        video_transcripts = []
+        for file_path in glob.glob(os.path.join(transcript_path, "*.txt")):
+            with open(file_path, 'r', encoding='utf-8') as f:
+                video_transcripts.append({
+                    "path": file_path,
+                    "content": f.read(),
+                    "base_name": os.path.splitext(os.path.basename(file_path))[0]
+                })
+        if not video_transcripts:
+            logger.error("No video transcripts found!")
+            return
+        # Get mentor materials
+        mentor_contents: Dict[str, str] = {}
+        for file_path in glob.glob(os.path.join(mentor_materials_path, "*.txt")):
+            base_name = os.path.splitext(os.path.basename(file_path))[0]
+            with open(file_path, 'r', encoding='utf-8') as f:
+                mentor_contents[base_name] = f.read()
+        # Generate reports
+        for video in video_transcripts:
+            base_name = video["base_name"]
+            logger.info(f"Generating report for: {base_name}")
+            material_content = mentor_contents.get(base_name, "")
+            material_type = ""
+            if "slide" in base_name.lower():
+                material_type = "slides"
+            elif "notebook" in base_name.lower():
+                material_type = "notebook"
+            report = self.quality_check(
+                video["content"],
+                material_type,
+                material_content
+            )
+            report_file = os.path.join(reports_dir, f"report_{base_name}.txt")
+            with open(report_file, 'w', encoding='utf-8') as f:
+                f.write(report)
+            logger.info(f"Report saved to {report_file}")
+            time.sleep(2)  # Avoid rate limiting

transcripts/Overview and Key Components of Agent SDK.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+start_time	end_time	speaker	transcript
+5.53	7.41	SPEAKER	introduction to agent SDK
+9.23	15.39	SPEAKER	what is agent SDK actually it is a software development kit
+16.95	51.71	SPEAKER	toolkit for building autonomous AI agents automatic workable AI agents can be generated with the help of agent SDK which will always provide a platform a resource and tools and libraries in order to develop these AI agents then it will also help to create a flexible and reusable AI systems later it will enable the integration of certain goals tools and memory in agents
+53.48	125.15	SPEAKER	so agent SDK plays a very important role in order to build an AI agent so this is a brief intro about agent SDK let's understand the key components of agent SDK what are the key components do we have first goal meaning a human is giving prompt to the AI system that is the goal for the AI system the requirement received from the user end terms to be the goal for the agent then tools what are the tools it will involve in order to create a specified result a relevant result tools lays an important role than memory after finding the results where it will store obviously in the memory so memory is also a key component of agent SDK then reasoning loop the chat that happens between the agent and the human or the user
+126.98	228.99	SPEAKER	this is reasoning loop first i will ask agent or AI system hi how are you i will get a response i'm good how can i help you from the agent right so this conversation will go on please list top AI trends for twenty twenty five is the goal for example what are the tools the web search it will make the integrated apis into that AI system plays a role of tool memory first it will store it will search it will store five to six courses or trends with respect to the artificial intelligence it will list back end it will be stored in the memory then after storing what happens it will list the AI trends of twenty twenty five in the output screen once this is listed the user will try to change or tweak their particular prompt how they will change maybe this time data science oriented trends they're asking for a second goal now and sometimes they might also ask out of six trends which you have listed which is the best so again it will go to a thinking mode this reasoning will go on loop until unless the user exits from the AI system this is just a common example which i tried to give you in order to relate the key components of agent SDK

transcripts/Use case of Agent SDK.txt ADDED Viewed

	@@ -0,0 +1,16 @@

+start_time	end_time	speaker	transcript
+5.21	75.91	SPEAKER	now it's time to explore problem statement where it involves agent SDK and google SDK both of the use cases combined together in one program addressing one problem statement let's hop on to google collab and understand how the problem statement is listed and what is our solution how do we resolve the same let's quickly hop on to google platform here we are on the google collab platform addressing our problem statement which involves google SDK indeed agent SDK as well so what do we do here we are trying to build AI agent using google SDK to automate real time web search tasks what's happening here what's our objective we have to develop a simple autonomous AI agent that takes a user defined goal it performs a real time web search using google custom search API
+77.59	150.19	SPEAKER	that is google SDK and presents relevant results to the user the agent should also retain memory of the past goals and result for reference so this is the objective and the problem statement basically we are trying to build an AI agent which will have a custom web search task on real time what are the key features of this it will accept the user defined goal that is a search query that's the prompt it will use google custom search API to fetch top search results that is the tool display the top three results including title URL and a snippet this is the result it will store the goal and results in the memory for future use also it will provide an option to refine the goal manually or conclude the session basically this is addressing in a manual perspective but serving the purpose of problem statement so these are the key features will be learning
+151.96	226.03	SPEAKER	when we learn about this particular code then what is the expected outcome of this as i told you we have a goal we have a tool that is google custom search API action is nothing but searching for those particular top three results of the goal whatever it has been set and then displaying those three urls with title and snippet is the result then the real time search result deliver based on user inputs that's the expected outcome then a memory system that logs all goals and search outcomes during this session so this is the overall goal expected outcome and problem statement the features and objectives hope we are clear and set now let's understand the coding my codes are generally very self explanatory so it's easy to understand indeed i'll also be explaining how does these things work here
+227.75	259.12	SPEAKER	first what do we do we install the required package what is the package that is google API python client we are using pip install and we are trying to install the required package then we have to import certain modules so we have to import from google API client we import which is called build that's the module we are trying to build the AI agent right
+261.12	278.40	SPEAKER	now in order to interact we should know two important things one API key you have to replace with your own API key when you are working this is my API key which has been set search engine ID
+280.59	314.32	SPEAKER	that is google search engine ID you can replace that with your own so that's why i have mentioned in the comment replace these two keys accordingly OK then we are sorted with API configuration now the question is where do i find the API key and where do i find the search engine ID i'll quickly give you a walk through where you can find and how you can generate then we will proceed with the further code
+316.74	518.87	SPEAKER	let's understand how do we generate API key overall i'm just giving a gist of how do we do this first we have to go to google cloud there we have to select credentials once we select credentials you have an option to create credentials what kind of credential you can create let's see click on that you have different kinds of credentials available the first thing is API key click on the API key it will start creating your key ensure your particular API key is copied as and when it is created you can just copy this and paste it in a secure place right so once it's created you can close this if you want to see the API key you can click on show key it will show you that particular API key i'll close this if you want to edit something you can edit the API key here let's see what are the things we have here restrictions i've got no restrictions if you want certain websites to be restricted or certain i addresses restricted you can select them don't restrict key i have just put this across so it's by default i have not done anything it's just i've generated the API key and if you want to change the name you can change it here as well and save for now i'm not changing anything i'm just keeping as it is so you can copy that particular key go back and paste it here that is the API key now we have one more thing that is called search engine so what is the search engine ID where do we get this we will have a look at that as well you have to go to programmable search engine on google chrome you will get a screen like this there is no search engines created here first time we are creating so we'll click on create your first search engine once you do this you can give a name for your search engine what are the different sites you want to list you can list individual pages as well you can also list the parts of a site as well so what i'm doing i'm keeping it universal i'm keeping it WWW dot google dot com so the complete google search engine is customized so 
now we will enable image search and safe search both so do not forget to click on add here once you do this see you have your particular URL listed here the website generally so i'm not a robot i'll just click this and you press on create once you do that you can see a preview here it's in the format of script right HTML script so you go to customize once you go to customize you will get a search engine ID copy this if you want URL you have an URL as well which is also ending with the same search engine ID you can see both are same now
+520.51	539.59	SPEAKER	so what are the different search features enabled by default it was image search and safe search if you want to search the entire web you can toggle this as well if you want to see any advanced all features of settings you can see here
+541.32	772.23	SPEAKER	so query enhancement if you want to add keywords specifically you can add it so you have all these features available if you want to restrict certain pages you can restrict basically you can enable a custom google search engine that is what i meant to say so i think you're clear with how do you get your search engine ID so i'm just going back again just showing you this it is available in the code format as well if you want to describe you can give a description too you have to just copy the search engine ID get back to your code and replace in the relevant place here right this is about the API configuration which you have to set hope we are clear with this step now let's proceed with the next steps memory to store past goals and results whatever you search with the help of your custom google SDK it has to be stored right for that you have to create a open space the memory space after assigning a memory space next we have to define the tool function using google SDK why do we do this we have to ensure the google search is happening for the query which has been given it has to search with the help of what with the help of two things one the API key which is integrated and the search engine ID that search engine is not a normal open public search engine it is a custom google search engine which we have created and added that i'd into our code hope we are clear until here next we have to define the AI agents reasoning loop what is this reasoning loop it involves received goal the prompt which is received from the user then we will use google search tool which is created then we will display top three results it will have the result title URL and the snippet if any then we will store that in the memory with the help of memory append function we are trying to append the goal and the results so how many goals and results are stored that has been totaled total stored goals the numbers as been mentioned here next we are done with our goal tool and 
memory let's see what we can do next real time interaction i am just trying to give the real time feel of interaction with the SDK first it will state a welcome statement it will be printed then it will ask to enter your search goal what is your search goal for example top AI research labs in twenty twenty five i will be typing the same then we will run when you run what will happen it will go to the reasoning loop which we have created here right after it enters the reasoning loop it will finish all the assigned functions once it completes the execution of the functions in the reasoning loop it will show all the memory at the end so again you will have a for loop for that and we will try to list everything out so this is about the code of generating a custom search engine with the help of google SDK so the agent has been built let's run
+776.53	785.57	SPEAKER	the output is this way let us try to take all the apis the google authentications everything
+787.42	798.94	SPEAKER	it is asking enter your search goal after welcoming us to AI agent plus google SDK so i am typing the same top AI
+801.69	810.91	SPEAKER	research labs in twenty twenty five OK i'm clicking on enter once i do that
+813.06	869.11	SPEAKER	agent has received the goal that is top AI research labs in twenty twenty five the tool is searching in google for the same then the AI has got top three results what are these results as i mentioned it is having title URL and a snippet so here is the title result number one result number two and result number three so memory is stored goal and results total stored goals is one because i have given one single query right one single prompt so this is how it will list in the final memory log so this is how this particular code works when you integrate and try to understand how an agent SDK's key components and google SDK work
+871.24	1125.11	SPEAKER	now there is one small constraint if you have observed or not i'm not sure but i'll try to explain what are the constraints do we have in this code first the agent operates only with the manual refinement no AI generated refinements available that's the fault that's the disadvantage search is limited to what google 's custom search API can return and it is having the quota limits it is restricted what do you do now you have a enhancement solution what all you can do let GPT also summarize the search results you can enhance this drawbacks by integrating open AI API key into the same code how do you do this how realistic it will be let's understand more about this we have old constraint that is the manual refinement issue now you can automatically add the GPT the agent becomes self sufficient it will think refine act that is search learn that is stores in the memory then what is the flow of execution for this first agent receives the goal simple it will search in google using the goal this is what we were doing it now additional step is refining goal using GPT so when you have given top AI research labs in twenty twenty five it will try to refine with the help of GPT leading artificial intelligence research institutes of worldwide twenty twenty five so this is a refinement that has been given to the goal which is already provided by the user it will search in the google again using GPT refined goal and it will store both the goals and results both of it will be stored accordingly we are not changing the execution flow we are just adding the GPT version in middle that's it that's the only enhancement we are doing in order to keep it in realistic manner the same code you have imports you have API keys you have memory store tool number one tool number two tool number one is google search tool number two here this is the addition open AI GPT for refinement this is the tool number two we have we have a function called refine query with GPT for that 
we have integrated few of the elements so we have kept the temperature max tokens is fifty so all these restrictions is also been put up and refined query also it will generate and give then the AI agent reasoning loop will start like before right it will again display the top three results then refine goal using GPT then display again the refine results so first it will display as it is the original then it will go towards the refined goal then it will create the result which is having the refined result so both of it will be stored in the memory so this is how this particular code will work with the enhancement of open AI API key now you have to see one important thing with API key and search engine ID we also have open AI API key integrated so when you do this you have to go to open AI platform again it is only towards the paid version of chatgpt or open AI so you can just go to open AI platform generate the API key there and paste it right here so this is how the code will look like you will get this particular code in your course just download try to replace all the API keys and run this particular code we have seen the use cases where we have integrated
+1126.71	1160.83	SPEAKER	agent SDK and google SDK i mean agent SDK's key components the way it works it has been shown with the help of google SDK also there is one small assignment you can just download this particular code try to execute the integration of open AI you can add the API key and try to run and check for the difference how realistic the query looks like

transcripts/Working of Agent SDK.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+start_time	end_time	speaker	transcript
+5.11	27.55	SPEAKER	next how does this agent SDK work that's more important to know first as i mentioned setting up a goal that is prompting once the agent receives the prompt it will decide what's the tool in need for example if i say please provide
+29.24	65.67	SPEAKER	a simple program in order to add two numbers in python programming language so tool will be a python program right so next action it will try to write the code on behalf and it will try to display on the output screen which turns out to be the result as simple as that it's not having much complicated elements involved we will prompt it will decide the tool the action will be taken and the result will be displayed this is a simple working of agent SDK