Spaces:

Rivalcoder
/

Pdf-Processing

Sleeping

Pdf-Processing / app.py

Rivalcoder

Add application file

6928eef 7 months ago

762 Bytes

	import fitz # PyMuPDF
	import gradio as gr

	def extract_text_from_pdf(file):
	if file is None:
	return "No file uploaded."

	try:
	doc = fitz.open(file.name) # Use file path directly
	full_text = ""
	for page_num in range(len(doc)):
	page = doc.load_page(page_num)
	text = page.get_text()
	full_text += f"\n\n--- Page {page_num + 1} ---\n\n{text}"
	return full_text
	except Exception as e:
	return f"Error: {str(e)}"

	gr.Interface(
	fn=extract_text_from_pdf,
	inputs=gr.File(label="Upload PDF", file_types=[".pdf"]),
	outputs="text",
	title="PDF to Text Extractor",
	description="Upload a PDF file and get all the extracted text from each page.",
	).launch()