# data_set_jee / app.py
# Optimus-Prym's picture
# Create app.py
# 90aedff verified
# raw
# history blame contribute delete
# 430 Bytes
import fitz # PyMuPDF
import gradio as gr
def extract_text_from_pdf(pdf_file, max_chars=3000):
    """Extract the leading text of a PDF using PyMuPDF.

    Args:
        pdf_file: The uploaded PDF. Accepted forms are a file-like object
            exposing ``read()`` (the original contract), raw ``bytes``, or a
            filesystem path (``str`` / ``pathlib.Path``). ``None`` is treated
            as "nothing was uploaded".
            NOTE(review): which of these forms the Gradio ``File`` component
            delivers depends on the installed Gradio version and its ``type``
            setting -- confirm against the deployment.
        max_chars: Maximum number of characters to return (non-negative).
            Defaults to 3000, the preview length this function has always
            used.

    Returns:
        The text of the pages concatenated in document order and truncated
        to ``max_chars`` characters, or an empty string when ``pdf_file`` is
        ``None``.
    """
    if pdf_file is None:
        # Nothing to parse; return an empty preview instead of crashing on
        # ``None.read()``.
        return ""

    if isinstance(pdf_file, (bytes, bytearray)):
        document = fitz.open(stream=bytes(pdf_file), filetype="pdf")
    elif hasattr(pdf_file, "read"):
        document = fitz.open(stream=pdf_file.read(), filetype="pdf")
    else:
        # Anything else is assumed to be a path to the PDF on disk.
        document = fitz.open(pdf_file)

    pieces = []
    collected = 0
    # The context manager closes the document even if text extraction fails.
    with document:
        for page in document:
            if collected >= max_chars:
                # Enough text for the preview; skip the remaining pages.
                break
            page_text = page.get_text()
            pieces.append(page_text)
            collected += len(page_text)

    return "".join(pieces)[:max_chars]
# Build the web UI: a single PDF upload input wired to the text extractor,
# with the result shown in a plain text output.
demo = gr.Interface(
    fn=extract_text_from_pdf,
    inputs=gr.File(file_types=[".pdf"]),
    outputs="text",
    # The emoji was stored as mis-decoded bytes; written as the intended
    # "page" character so the title renders correctly.
    title="📄 JEE PDF Extractor",
)

# Start the Gradio server (runs at module level, as before).
demo.launch()