Spaces:

ayushsoni155
/

Invoice_IMG_To_JSON

Sleeping

Ayush soni committed on Sep 26, 2025

Commit

e98e646

1 Parent(s): 6034171

app.py fixed

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,28 +5,28 @@ from llm_processor import load_llm_model, generate_json_from_text
 # Load LLM model on startup
 load_llm_model()
-def process_invoice(file):
-    # Read file bytes
-    image_bytes = file.read()
-    # Step 1: Extract raw text
-    raw_text = extract_text_from_image(image_bytes)
     if not raw_text or "No text detected" in raw_text:
         return raw_text, {"error": "No text could be extracted from the image."}
-    # Step 2: Convert raw text → structured JSON
     json_data = generate_json_from_text(raw_text)
     return raw_text, json_data
 ### Gradio UI
 with gr.Blocks() as demo:
     gr.Markdown("# 🧾 Invoice Processing App")
     gr.Markdown("Upload an invoice image. The app extracts **OCR text** and generates **structured JSON**.")
     with gr.Row():
-        input_file = gr.File(label="Upload Invoice Image", type="file", file_types=[".png", ".jpg", ".jpeg"])
     with gr.Row():
         raw_text_output = gr.Textbox(label="Extracted OCR Text", lines=10)

 # Load LLM model on startup
 load_llm_model()
+def process_invoice(file_bytes):
+    if file_bytes is None:
+        return "No file uploaded", {"error": "No file uploaded"}
+    # Step 1: Extract text
+    raw_text = extract_text_from_image(file_bytes)
     if not raw_text or "No text detected" in raw_text:
         return raw_text, {"error": "No text could be extracted from the image."}
+    # Step 2: JSON generation
     json_data = generate_json_from_text(raw_text)
     return raw_text, json_data
 ### Gradio UI
 with gr.Blocks() as demo:
     gr.Markdown("# 🧾 Invoice Processing App")
     gr.Markdown("Upload an invoice image. The app extracts **OCR text** and generates **structured JSON**.")
     with gr.Row():
+        input_file = gr.File(label="Upload Invoice Image", type="binary", file_types=[".png", ".jpg", ".jpeg"])
     with gr.Row():
         raw_text_output = gr.Textbox(label="Extracted OCR Text", lines=10)