Spaces:

tensorlake
/

document-extractors

Sleeping

rishiraj committed on Jun 7, 2024

Commit

cf23322

verified ·

1 Parent(s): c6e6f88

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -23,7 +23,7 @@ def use_marker(pdf_filepath):
 	config = MarkdownExtractorConfig(batch_multiplier=2)
 	result = markdown_extractor.extract(content, config)
-	return result
 @spaces.GPU
 def use_pdf_extractor(pdf_filepath):
@@ -37,9 +37,8 @@ def use_pdf_extractor(pdf_filepath):
 	config = PDFExtractorConfig(output_types=["text", "table"])
 	result = pdf_extractor.extract(content, config)
-	return result
-@spaces.GPU
 def use_gemini(pdf_filepath, key):
 	if pdf_filepath is None:
 		raise gr.Error("Please provide some input PDF: upload an PDF file")
@@ -51,9 +50,8 @@ def use_gemini(pdf_filepath, key):
 	config = GeminiExtractorConfig(prompt="Extract all text from the document.", model_name="gemini-1.5-flash", key=key)
 	result = gemini_extractor.extract(content, config)
-	return result
-@spaces.GPU
 def use_openai(pdf_filepath, key):
 	if pdf_filepath is None:
 		raise gr.Error("Please provide some input PDF: upload an PDF file")
@@ -65,7 +63,7 @@ def use_openai(pdf_filepath, key):
 	config = OAIExtractorConfig(prompt="Extract all text from the document.", model_name="gpt-4o", key=key)
 	result = oai_extractor.extract(content, config)
-	return result
 with gr.Blocks(title="PDF data extraction with Marker & Indexify") as marker_demo:
 	gr.HTML("<h1 style='text-align: center'>PDF data extraction with Marker & <a href='https://getindexify.ai/'>Indexify</a></h1>")

 	config = MarkdownExtractorConfig(batch_multiplier=2)
 	result = markdown_extractor.extract(content, config)
+	return str(result)
 @spaces.GPU
 def use_pdf_extractor(pdf_filepath):
 	config = PDFExtractorConfig(output_types=["text", "table"])
 	result = pdf_extractor.extract(content, config)
+	return str(result)
 def use_gemini(pdf_filepath, key):
 	if pdf_filepath is None:
 		raise gr.Error("Please provide some input PDF: upload an PDF file")
 	config = GeminiExtractorConfig(prompt="Extract all text from the document.", model_name="gemini-1.5-flash", key=key)
 	result = gemini_extractor.extract(content, config)
+	return str(result)
 def use_openai(pdf_filepath, key):
 	if pdf_filepath is None:
 		raise gr.Error("Please provide some input PDF: upload an PDF file")
 	config = OAIExtractorConfig(prompt="Extract all text from the document.", model_name="gpt-4o", key=key)
 	result = oai_extractor.extract(content, config)
+	return str(result)
 with gr.Blocks(title="PDF data extraction with Marker & Indexify") as marker_demo:
 	gr.HTML("<h1 style='text-align: center'>PDF data extraction with Marker & <a href='https://getindexify.ai/'>Indexify</a></h1>")