# Source: newpd / file_processing.py (commit ed508fd, "Create file_processing.py")
import PyPDF2
def extract_text_from_pdf(pdf_file):
    """Return the concatenated text of every page in a PDF.

    Args:
        pdf_file: The PDF source, passed unchanged to ``PyPDF2.PdfReader``.

    Returns:
        The result of ``extract_text()`` for each page, joined in page
        order with no separator between pages.
    """
    # PdfReader / .pages replace the legacy PdfFileReader / numPages /
    # getPage names, which PyPDF2 deprecated in 2.x and removed in 3.0.
    # They are available in every release that offers page.extract_text().
    pdf_reader = PyPDF2.PdfReader(pdf_file)
    # Join once instead of growing a string with += on every page.
    return "".join(page.extract_text() for page in pdf_reader.pages)
def process_text_file(text_file):
    """Read a file-like object and return its content decoded as UTF-8.

    Args:
        text_file: Object whose ``read()`` returns a value with a
            ``decode`` method (e.g. a file opened in binary mode).

    Returns:
        The decoded text.
    """
    raw_bytes = text_file.read()
    decoded = raw_bytes.decode('utf-8')
    # Perform any processing of the text document here and return the result.
    return decoded