Agent_course_Final_Assignment

Sleeping

RCaz committed on Nov 8, 2025

Commit

2bcf72e

verified ·

1 Parent(s): bea827c

Update agent.py

Files changed (1) hide show

agent.py CHANGED Viewed

@@ -18,6 +18,46 @@ def extract_text_from_audio(file_path : str) -> str:
     return text
 class TestAgent:
     def __init__(self):

     return text
+@tool
+def extract_text_from_audio(file_path: str) -> str:
+    """
+    Extract and return text transcription from an audio file using speech recognition.
+    This tool uses Google's speech recognition API to convert spoken audio content
+    into text. It supports various audio formats including WAV, AIFF, and FLAC
+    (formats supported by the SpeechRecognition library).
+    Args:
+        file_path (str): Path to the audio file to be transcribed. The file should
+                        be in a format compatible with the SpeechRecognition library.
+    Returns:
+        str: The extracted text content from the audio file.
+    Raises:
+        Exception : the exception
+    Examples:
+        >>> extract_text_from_audio("meeting_recording.wav")
+        "Hello team, welcome to our weekly meeting..."
+        >>> extract_text_from_audio("/path/to/audio/interview.mp3")
+        "Could you please introduce yourself and your background?"
+    """
+    import speech_recognition as sr
+    r = sr.Recognizer()
+    try:
+        with sr.AudioFile(file_path) as source:
+            # listen for the data (load audio to memory)
+            audio_data = r.record(source)
+            # recognize (convert from speech to text)
+            text = r.recognize_google(audio_data)
+        return text
+    except Exception as e:
+        return e
 class TestAgent:
     def __init__(self):