Spaces:

Arslan17121
/

AudioNotebook

Sleeping

App Files Community

Arslan17121 committed on Dec 31, 2024

Commit

8cf3d5d

verified ·

1 Parent(s): 498090e

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -63

app.py CHANGED Viewed

@@ -1,47 +1,21 @@
-import streamlit as st
-import pdfplumber
-from transformers import pipeline
-from gtts import gTTS
-import os
-# Function to extract text from PDF
-def extract_text_from_pdf(pdf_file):
-    text = ""
-    try:
-        with pdfplumber.open(pdf_file) as pdf:
-            for page in pdf.pages:
-                text += page.extract_text() or ""
-    except Exception as e:
-        st.error(f"Error reading the PDF: {e}")
-    return text
-# Function to generate discussion points
-def generate_discussion_points(text):
-    try:
-        summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
-        summary = summarizer(text, max_length=130, min_length=30, do_sample=False)
-        return summary[0]['summary_text']
-    except Exception as e:
-        st.error(f"Error during summarization: {e}")
-        return None
-# Function to convert text to speech
-def text_to_speech(text, output_file="output.mp3"):
-    try:
-        tts = gTTS(text)
-        tts.save(output_file)
-        return output_file
-    except Exception as e:
-        st.error(f"Error during text-to-speech conversion: {e}")
-        return None
-# Streamlit app starts here
-st.title("📄 PDF Discussion Points Generator")
-st.write("Upload a small PDF file to generate discussion points and listen to them.")
 # File uploader
 uploaded_file = st.file_uploader("Upload a PDF", type=["pdf"])
 if uploaded_file:
     # Extract text from uploaded PDF
     with st.spinner("Extracting text from the uploaded PDF..."):
@@ -53,33 +27,35 @@ if uploaded_file:
         # Generate discussion points
         with st.spinner("Generating discussion points..."):
-            discussion_points = generate_discussion_points(pdf_text)
-            if discussion_points:
                 st.write("### Discussion Points")
                 st.text_area("Discussion Points", discussion_points, height=150)
-                # Convert discussion points to audio
-                with st.spinner("Converting discussion points to audio..."):
                     audio_file = text_to_speech(discussion_points)
-                    if audio_file:
-                        st.success("Audio file generated successfully!")
-                        # Audio playback
-                        st.write("### Listen to the Discussion Points")
-                        audio_bytes = open(audio_file, "rb").read()
-                        st.audio(audio_bytes, format="audio/mp3")
-                        # Option to download the audio file
-                        st.download_button(
-                            label="Download Audio",
-                            data=audio_bytes,
-                            file_name="discussion_points.mp3",
-                            mime="audio/mp3"
-                        )
-            else:
-                st.error("Failed to generate discussion points. Please try again.")
     else:
         st.error("No text was extracted from the uploaded PDF. Please try with another file.")
 else:

+# Function to generate discussion points with a prompt
+def generate_discussion_points(text, user_prompt=""):
+    summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
+    # Prepend the user prompt to the text for guided summarization
+    input_text = f"{user_prompt}\n\n{text}"
+    summary = summarizer(input_text, max_length=130, min_length=30, do_sample=False)
+    return summary[0]['summary_text']
+# Streamlit app
+st.title("📄 PDF Discussion Points Generator with User Prompts")
+st.write("Upload a PDF file, provide a prompt for the summary, and listen to the generated discussion points.")
 # File uploader
 uploaded_file = st.file_uploader("Upload a PDF", type=["pdf"])
+# Prompt input
+user_prompt = st.text_input("Enter a specific prompt for the summary (optional):", "")
 if uploaded_file:
     # Extract text from uploaded PDF
     with st.spinner("Extracting text from the uploaded PDF..."):
         # Generate discussion points
         with st.spinner("Generating discussion points..."):
+            try:
+                discussion_points = generate_discussion_points(pdf_text, user_prompt)
                 st.write("### Discussion Points")
                 st.text_area("Discussion Points", discussion_points, height=150)
+            except Exception as e:
+                st.error(f"Error during summarization: {e}")
+            # Convert discussion points to audio
+            with st.spinner("Converting discussion points to audio..."):
+                try:
                     audio_file = text_to_speech(discussion_points)
+                    st.success("Audio file generated successfully!")
+                except Exception as e:
+                    st.error(f"Error during text-to-speech conversion: {e}")
+                    audio_file = None
+            if audio_file:
+                # Audio playback
+                st.write("### Listen to the Discussion Points")
+                audio_bytes = open(audio_file, "rb").read()
+                st.audio(audio_bytes, format="audio/mp3")
+                # Option to download the audio file
+                st.download_button(
+                    label="Download Audio",
+                    data=audio_bytes,
+                    file_name="discussion_points.mp3",
+                    mime="audio/mp3"
+                )
     else:
         st.error("No text was extracted from the uploaded PDF. Please try with another file.")
 else: