Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -10,14 +10,6 @@ import tempfile
|
|
| 10 |
import shutil
|
| 11 |
import spaces
|
| 12 |
|
| 13 |
-
# Define paths
|
| 14 |
-
pdf_path = './resources/uploaded_pdf.pdf'
|
| 15 |
-
clean_text_path = './resources/clean_text.txt'
|
| 16 |
-
transcript_path = './resources/data.pkl'
|
| 17 |
-
tts_ready_path = './resources/podcast_ready_data.pkl'
|
| 18 |
-
audio_output_path = 'final_podcast_audio.mp3'
|
| 19 |
-
|
| 20 |
-
|
| 21 |
|
| 22 |
def create_temp_session_directory():
|
| 23 |
return tempfile.mkdtemp()
|
|
@@ -38,7 +30,7 @@ def process_pdf_to_podcast(pdf_file):
|
|
| 38 |
# Step 1: Extract Text from PDF
|
| 39 |
shutil.copy(pdf_file, pdf_path)
|
| 40 |
|
| 41 |
-
extractor = PDFTextExtractor(pdf_path)
|
| 42 |
clean_text_path = extractor.clean_and_save_text()
|
| 43 |
|
| 44 |
# Display a preview of extracted text
|
|
|
|
| 10 |
import shutil
|
| 11 |
import spaces
|
| 12 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 13 |
|
| 14 |
def create_temp_session_directory():
|
| 15 |
return tempfile.mkdtemp()
|
|
|
|
| 30 |
# Step 1: Extract Text from PDF
|
| 31 |
shutil.copy(pdf_file, pdf_path)
|
| 32 |
|
| 33 |
+
extractor = PDFTextExtractor(pdf_path,clean_text_path)
|
| 34 |
clean_text_path = extractor.clean_and_save_text()
|
| 35 |
|
| 36 |
# Display a preview of extracted text
|