Spaces:

abhishekjoel
/

AI_notes

Sleeping

App Files Files Community

abhishekjoel committed on Nov 14, 2024

Commit

af29e2b

verified ·

1 Parent(s): 2e97d93

Update app.py

Browse files

Files changed (1) hide show

app.py +26 -7

app.py CHANGED Viewed

@@ -13,11 +13,16 @@ openai.api_key = os.getenv('OPENAI_API_KEY')
 # Function to transcribe audio using OpenAI Whisper
 def transcribe_audio(audio_file):
     try:
-        audio = AudioSegment.from_file(audio_file)
         buffer = io.BytesIO()
         audio.export(buffer, format="wav")
         buffer.seek(0)
         buffer.name = "audio.wav"
         response = openai.Audio.transcribe(
             "whisper-1",
             file=buffer,
@@ -30,15 +35,23 @@ def transcribe_audio(audio_file):
 # Function to extract text from PDF
 def extract_text_from_pdf(pdf_file):
-    reader = PyPDF2.PdfReader(pdf_file)
-    text = ""
-    for page in reader.pages:
-        text += page.extract_text() + "\n"
-    return text
 # Function to get YouTube transcript
 def get_youtube_transcript(url):
     try:
         if "watch?v=" in url:
             video_id = url.split("watch?v=")[1].split("&")[0]
         elif "youtu.be/" in url:
@@ -46,9 +59,11 @@ def get_youtube_transcript(url):
         else:
             st.error("Invalid YouTube URL.")
             return None
         transcript_list = YouTubeTranscriptApi.list_transcripts(video_id)
         transcript = transcript_list.find_transcript(['en'])
         transcript_data = transcript.fetch()
         transcription_text = " ".join([entry['text'] for entry in transcript_data])
         return transcription_text
     except Exception as e:
@@ -77,7 +92,8 @@ def create_pdf(notes):
 # Main app
 def main():
-    st.title("AI Notes Generation bot")
     st.markdown("---")
     st.subheader("Upload your file:")
@@ -101,6 +117,9 @@ def main():
                 return
         elif input_type == "PDF Document" and pdf_input:
             transcription_text = extract_text_from_pdf(pdf_input)
         elif input_type == "YouTube URL" and youtube_input:
             transcription_text = get_youtube_transcript(youtube_input)
             if not transcription_text:

 # Function to transcribe audio using OpenAI Whisper
 def transcribe_audio(audio_file):
     try:
+        # Read the bytes from the uploaded audio file
+        audio_bytes = audio_file.read()
+        # Use io.BytesIO to create a file-like object
+        audio = AudioSegment.from_file(io.BytesIO(audio_bytes))
+        # Convert to WAV and prepare for transcription
         buffer = io.BytesIO()
         audio.export(buffer, format="wav")
         buffer.seek(0)
         buffer.name = "audio.wav"
+        # Transcribe audio using OpenAI Whisper
         response = openai.Audio.transcribe(
             "whisper-1",
             file=buffer,
 # Function to extract text from PDF
 def extract_text_from_pdf(pdf_file):
+    try:
+        # Read the bytes from the uploaded PDF file
+        pdf_bytes = pdf_file.read()
+        # Use io.BytesIO to create a file-like object
+        reader = PyPDF2.PdfReader(io.BytesIO(pdf_bytes))
+        text = ""
+        for page in reader.pages:
+            text += page.extract_text() + "\n"
+        return text
+    except Exception as e:
+        st.error(f"Error processing PDF: {str(e)}")
+        return None
 # Function to get YouTube transcript
 def get_youtube_transcript(url):
     try:
+        # Extract video ID from URL
         if "watch?v=" in url:
             video_id = url.split("watch?v=")[1].split("&")[0]
         elif "youtu.be/" in url:
         else:
             st.error("Invalid YouTube URL.")
             return None
+        # Fetch transcript
         transcript_list = YouTubeTranscriptApi.list_transcripts(video_id)
         transcript = transcript_list.find_transcript(['en'])
         transcript_data = transcript.fetch()
+        # Combine transcript texts
         transcription_text = " ".join([entry['text'] for entry in transcript_data])
         return transcription_text
     except Exception as e:
 # Main app
 def main():
+    st.set_page_config(layout="wide")
+    st.markdown("<h1 style='text-align: center;'>AI Notes Generation Bot 🤖</h1>", unsafe_allow_html=True)
     st.markdown("---")
     st.subheader("Upload your file:")
                 return
         elif input_type == "PDF Document" and pdf_input:
             transcription_text = extract_text_from_pdf(pdf_input)
+            if not transcription_text:
+                st.error("Failed to extract text from PDF.")
+                return
         elif input_type == "YouTube URL" and youtube_input:
             transcription_text = get_youtube_transcript(youtube_input)
             if not transcription_text: