"""Streamlit front end for INDRA OCR.

The script lets the user upload an invoice image, runs information
detection/OCR, table detection, table structure recognition and TrOCR on it
(all provided by the project modules imported below), shows the extracted
table and offers it as a CSV download.
"""

import importlib
import importlib.util
import io
import subprocess
import sys
from typing import Iterable

import numpy as np
import pandas as pd
import streamlit as st
from PIL import Image

# List of required packages (pip distribution names).
required_packages = [
    "transformers",
    "ultralytics",
    "opencv-python-headless",
    "tqdm",
    "torch",
    "torchvision",
    "easyocr",
]

# Distributions whose importable module name differs from the pip name.
# Without this mapping the "is it installed?" probe can never succeed for
# them, and pip would be launched on every Streamlit rerun.
_IMPORT_NAMES = {
    "opencv-python-headless": "cv2",
}

# Session-state keys that hold per-upload results.
_RESULT_KEYS = ("processed_data", "cropped_image", "cell_coordinates", "df")


def _is_installed(module_name: str) -> bool:
    """Return True when *module_name* can be located without importing it."""
    if module_name in sys.modules:
        return True
    try:
        return importlib.util.find_spec(module_name) is not None
    except (ImportError, ValueError):
        return False


def install_packages(packages: Iterable[str]) -> None:
    """Install every package in *packages* that is not importable yet.

    Args:
        packages: pip requirement strings, optionally pinned with ``==``.

    Raises:
        subprocess.CalledProcessError: if a ``pip install`` call fails.
    """
    installed_any = False
    for package in packages:
        dist_name = package.split("==")[0]
        module_name = _IMPORT_NAMES.get(dist_name, dist_name)
        if _is_installed(module_name):
            continue
        print(f"Installing {package}...")
        subprocess.check_call([sys.executable, "-m", "pip", "install", package])
        installed_any = True
    if installed_any:
        # Let the running interpreter see the freshly installed packages.
        importlib.invalidate_caches()


def _reset_results(uploaded_file) -> None:
    """Remember *uploaded_file* and clear all results cached for the previous one."""
    st.session_state.uploaded_image = uploaded_file
    for key in _RESULT_KEYS:
        st.session_state[key] = None


def _first_table(detections):
    """Return the first detected table crop, or None when nothing was detected."""
    if detections is None:
        return None
    if isinstance(detections, list):
        return detections[0] if detections else None
    return detections


# Install required packages (must happen before the project imports below).
install_packages(required_packages)

# Import your models and utility functions
from TD import TD_model1  # noqa: E402
from tsr import TSR, get_cell_coordinates_by_row, apply_ocr  # noqa: E402,F401
from info_det_ocr import info_det_and_ocr  # noqa: E402
from Tr_ocr import apply_TRocr  # noqa: E402

# Set page config
st.set_page_config(
    page_title="INDRA OCR",
    page_icon="🧾",
    layout="wide",
)

# Customizing background color and font color
# NOTE(review): this string (and the footer below) contains only a space;
# the intended CSS/HTML looks like it was lost - confirm against the original.
st.markdown(""" """, unsafe_allow_html=True)

# App Header
st.markdown(
    """

INDRA OCR: Intelligent Invoice Data Recognition and Automation

""",
    unsafe_allow_html=True,
)

# Two columns: a narrow one for the file uploader and a wide one for the
# image and the extracted data.
col1, col2 = st.columns([1, 3])

with col1:
    uploaded_file = st.file_uploader(
        "Upload Your Invoice (JPG, JPEG, PNG):",
        type=["jpg", "jpeg", "png"],
        label_visibility="collapsed",
    )

with col2:
    if uploaded_file is not None:
        # A new upload invalidates everything cached for the previous image.
        if (
            "uploaded_image" not in st.session_state
            or st.session_state.uploaded_image != uploaded_file
        ):
            _reset_results(uploaded_file)

        # Render the image on every run so it stays visible after reruns
        # triggered by other widgets (e.g. the download button).
        image = Image.open(uploaded_file)
        image.thumbnail((800, 800))  # Resize to fit within the 800px limit
        st.image(image, caption="Uploaded Image", width=500)

        # Process the image only if it hasn't been processed yet
        if st.session_state.processed_data is None:
            # Normalise RGBA / palette / grayscale uploads to 3 channels.
            # NOTE(review): assumes the models expect RGB arrays - confirm
            # against TD / tsr / info_det_ocr.
            image_arr = np.array(image.convert("RGB"))

            # Run info detection and OCR
            st.session_state.processed_data = info_det_and_ocr(image_arr)

            # Run the table detection model and keep the first crop
            cropped_image = _first_table(TD_model1(image_arr))
            if cropped_image is None:
                st.warning("No table was detected in the uploaded invoice.")
            else:
                st.session_state.cropped_image = cropped_image

                # Run Table Structure Recognition (TSR)
                _, cells = TSR(cropped_image)

                # Get cell coordinates for the recognised table cells
                cell_coordinates = get_cell_coordinates_by_row(cells)
                st.session_state.cell_coordinates = cell_coordinates

                # Use TR OCR for extracting table data
                data = apply_TRocr(cropped_image, cell_coordinates)

                # Store the DataFrame in session state for CSV download
                st.session_state.df = pd.DataFrame(data)

        # Show extracted data if the dataframe is available
        df = st.session_state.get("df")
        if df is not None:
            st.markdown("### Extracted Data Table:")
            st.dataframe(df)

            st.markdown("### Download Extracted Data")
            # With no target path, to_csv returns the CSV text directly.
            csv_data = df.to_csv(index=False).encode("utf-8")
            st.download_button(
                label="Download CSV",
                data=csv_data,
                file_name="extracted_table_data.csv",
                mime="text/csv",
            )

# Footer
st.markdown(
    """ """,
    unsafe_allow_html=True,
)