AP_AGENT

Sleeping

App Files Community

Seth0330 committed on Jun 17, 2025

Commit

1108365

verified ·

1 Parent(s): dc0c728

Update app.py

Browse files

Files changed (1) hide show

app.py +81 -13

app.py CHANGED Viewed

@@ -246,28 +246,94 @@ def find_best_po_match(inv, po_df):
         po_unit = str(row.get("Item Unit Price", ""))
         po_line_total = clean_num(row.get("Line Item Total", ""))
-        # Weighted fuzzy scores
         s_supplier = weighted_fuzzy_score(inv_supplier, po_supplier)
         s_ship_to = weighted_fuzzy_score(inv_ship_to, po_ship_to)
         s_bill_to = weighted_fuzzy_score(inv_bill_to, po_bill_to)
         s_terms = weighted_fuzzy_score(inv_payment_terms, po_payment_terms)
         s_currency = weighted_fuzzy_score(inv_currency, po_currency)
         s_total = 100 if inv_total_due is not None and po_total is not None and abs(inv_total_due - po_total) < 2 else 0
         # Check for at least one line item strong match
         line_item_score = 0
         line_reason = ""
         for line in inv_line_items:
             desc_score = weighted_fuzzy_score(line.get("description", ""), po_desc)
             qty_score = 100 if clean_num(line.get("quantity")) == clean_num(po_qty) else 0
             unit_score = 100 if clean_num(line.get("price")) == clean_num(po_unit) else 0
             amount_score = 100 if clean_num(line.get("amount")) == po_line_total else 0
             total = desc_score * 0.5 + qty_score * 0.2 + unit_score * 0.15 + amount_score * 0.15
             if total > line_item_score:
                 line_item_score = total
-                line_reason = (f"Best line item: desc_score={desc_score}, qty_score={qty_score}, "
-                               f"unit_score={unit_score}, amount_score={amount_score}")
-        # Score weights (tune as needed)
         total_score = (
             s_supplier * 0.25 +
             s_ship_to * 0.1 +
@@ -277,25 +343,26 @@ def find_best_po_match(inv, po_df):
             s_total * 0.2 +
             line_item_score * 0.2
         )
         reason = (
-            f"Supplier match: {s_supplier}/100, Ship To: {s_ship_to}/100, "
-            f"Bill To: {s_bill_to}/100, Payment Terms: {s_terms}/100, Currency: {s_currency}/100, "
-            f"Total Due: {'match' if s_total else 'no match'}, "
             f"Line item best match: {int(line_item_score)}/100. {line_reason}"
         )
         debug = {
             "po_idx": idx,
             "po_supplier": po_supplier,
             "po_ship_to": po_ship_to,
             "po_bill_to": po_bill_to,
             "po_total": po_total,
-            "s_supplier": s_supplier,
-            "s_ship_to": s_ship_to,
-            "s_bill_to": s_bill_to,
-            "s_terms": s_terms,
-            "s_currency": s_currency,
-            "s_total": s_total,
             "line_item_score": line_item_score,
             "total_score": total_score,
             "line_reason": line_reason,
             "inv_total_due": inv_total_due
@@ -309,6 +376,7 @@ def find_best_po_match(inv, po_df):
     best_row, best_score, reason, debug = scores[0]
     return best_row, best_score, reason, debug
 def extract_invoice_info(model_choice, text):
     prompt = get_extraction_prompt(model_choice, text)
     raw = query_llm(model_choice, prompt)

         po_unit = str(row.get("Item Unit Price", ""))
         po_line_total = clean_num(row.get("Line Item Total", ""))
+        field_details = []
         s_supplier = weighted_fuzzy_score(inv_supplier, po_supplier)
+        field_details.append({
+            "field": "Supplier Name",
+            "invoice": inv_supplier,
+            "po": po_supplier,
+            "score": s_supplier
+        })
         s_ship_to = weighted_fuzzy_score(inv_ship_to, po_ship_to)
+        field_details.append({
+            "field": "Ship To",
+            "invoice": inv_ship_to,
+            "po": po_ship_to,
+            "score": s_ship_to
+        })
         s_bill_to = weighted_fuzzy_score(inv_bill_to, po_bill_to)
+        field_details.append({
+            "field": "Bill To",
+            "invoice": inv_bill_to,
+            "po": po_bill_to,
+            "score": s_bill_to
+        })
         s_terms = weighted_fuzzy_score(inv_payment_terms, po_payment_terms)
+        field_details.append({
+            "field": "Payment Terms",
+            "invoice": inv_payment_terms,
+            "po": po_payment_terms,
+            "score": s_terms
+        })
         s_currency = weighted_fuzzy_score(inv_currency, po_currency)
+        field_details.append({
+            "field": "Currency",
+            "invoice": inv_currency,
+            "po": po_currency,
+            "score": s_currency
+        })
         s_total = 100 if inv_total_due is not None and po_total is not None and abs(inv_total_due - po_total) < 2 else 0
+        field_details.append({
+            "field": "Total Due",
+            "invoice": inv_total_due,
+            "po": po_total,
+            "score": s_total
+        })
         # Check for at least one line item strong match
         line_item_score = 0
         line_reason = ""
+        best_line_detail = None
         for line in inv_line_items:
             desc_score = weighted_fuzzy_score(line.get("description", ""), po_desc)
             qty_score = 100 if clean_num(line.get("quantity")) == clean_num(po_qty) else 0
             unit_score = 100 if clean_num(line.get("price")) == clean_num(po_unit) else 0
             amount_score = 100 if clean_num(line.get("amount")) == po_line_total else 0
             total = desc_score * 0.5 + qty_score * 0.2 + unit_score * 0.15 + amount_score * 0.15
+            detail = {
+                "field": "Line Item",
+                "invoice": {
+                    "description": line.get("description", ""),
+                    "quantity": line.get("quantity", ""),
+                    "price": line.get("price", ""),
+                    "amount": line.get("amount", ""),
+                },
+                "po": {
+                    "description": po_desc,
+                    "quantity": po_qty,
+                    "price": po_unit,
+                    "amount": po_line_total,
+                },
+                "desc_score": desc_score,
+                "qty_score": qty_score,
+                "unit_score": unit_score,
+                "amount_score": amount_score,
+                "line_item_score": total
+            }
             if total > line_item_score:
                 line_item_score = total
+                best_line_detail = detail
+                line_reason = (
+                    f"Best line item: desc_score={desc_score}, qty_score={qty_score}, "
+                    f"unit_score={unit_score}, amount_score={amount_score}"
+                )
         total_score = (
             s_supplier * 0.25 +
             s_ship_to * 0.1 +
             s_total * 0.2 +
             line_item_score * 0.2
         )
         reason = (
+            f"Supplier match: {s_supplier}/100 (invoice: '{inv_supplier}' vs PO: '{po_supplier}'), "
+            f"Ship To: {s_ship_to}/100 (invoice: '{inv_ship_to}' vs PO: '{po_ship_to}'), "
+            f"Bill To: {s_bill_to}/100 (invoice: '{inv_bill_to}' vs PO: '{po_bill_to}'), "
+            f"Payment Terms: {s_terms}/100 (invoice: '{inv_payment_terms}' vs PO: '{po_payment_terms}'), "
+            f"Currency: {s_currency}/100 (invoice: '{inv_currency}' vs PO: '{po_currency}'), "
+            f"Total Due: {'match' if s_total else 'no match'} (invoice: {inv_total_due} vs PO: {po_total}), "
             f"Line item best match: {int(line_item_score)}/100. {line_reason}"
         )
         debug = {
             "po_idx": idx,
             "po_supplier": po_supplier,
             "po_ship_to": po_ship_to,
             "po_bill_to": po_bill_to,
             "po_total": po_total,
+            "scores": field_details,
             "line_item_score": line_item_score,
+            "best_line_detail": best_line_detail,
             "total_score": total_score,
             "line_reason": line_reason,
             "inv_total_due": inv_total_due
     best_row, best_score, reason, debug = scores[0]
     return best_row, best_score, reason, debug
 def extract_invoice_info(model_choice, text):
     prompt = get_extraction_prompt(model_choice, text)
     raw = query_llm(model_choice, prompt)