Spaces:

pranavdaware
/

web_ocrgoi_ocr2.0

No application file

App Files Files Community

web_ocrgoi_ocr2.0 / app.py

pranavdaware

Create app.py

026ea7b verified over 1 year ago

raw

history blame contribute delete

2.66 kB

	import gradio as gr
	from transformers import AutoModel, AutoTokenizer
	import os
	import re

	# Load the model and tokenizer from local path
	# Assuming your model and tokenizer are stored in '/content/model' directory in Colab
	model_path = 'pranavdaware/web_ocr'

	# Load the model and tokenizer from the local directory
	tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
	model = AutoModel.from_pretrained(model_path, trust_remote_code=True, low_cpu_mem_usage=True, device_map='cuda', use_safetensors=True)
	model = model.eval().cuda()

	# Function to extract text using OCR
	def ocr_processing(image_file):
	try:
	# Perform OCR on the uploaded image
	result = model.chat(tokenizer, image_file, ocr_type='ocr')
	return result
	except Exception as e:
	return str(e)

	# Function to search for keywords in extracted text
	def search_keyword(ocr_text, keyword):
	try:
	# Use regex to search for the keyword and highlight matches
	matches = re.findall(rf"({keyword})", ocr_text, re.IGNORECASE)
	if matches:
	highlighted_text = re.sub(rf"({keyword})", r'<mark>\1</mark>', ocr_text, flags=re.IGNORECASE)
	return highlighted_text
	else:
	return f"No matches found for '{keyword}' in the extracted text."
	except Exception as e:
	return str(e)

	# Gradio interface
	def main():
	# Gradio app layout
	with gr.Blocks() as demo:
	gr.Markdown("# OCR and Keyword Search Application")

	with gr.Row():
	with gr.Column():
	image_input = gr.Image(type="filepath", label="Upload your image")
	keyword_input = gr.Textbox(label="Enter keyword to search")
	ocr_output = gr.Textbox(label="OCR Output")
	search_output = gr.HTML(label="Search Results")

	# Button for OCR processing
	process_button = gr.Button("Process Image for OCR")

	# Connect the OCR processing function to the button
	process_button.click(
	fn=ocr_processing,
	inputs=image_input,
	outputs=ocr_output
	)

	# Button for keyword search
	search_button = gr.Button("Search Keyword in OCR Text")

	# Connect the search function to the button
	search_button.click(
	fn=search_keyword,
	inputs=[ocr_output, keyword_input],
	outputs=search_output
	)

	# Launch the Gradio demo
	demo.launch()

	if __name__ == "__main__":
	main()