Spaces:

PD03
/

talk_to_data

Sleeping

App Files Community

PD03 committed on Jun 26, 2025

Commit

13050f3

verified ·

1 Parent(s): 1c34919

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -32

app.py CHANGED Viewed

@@ -1,53 +1,36 @@
 import gradio as gr
 import pandas as pd
 from transformers import pipeline
-# 1) Load your data
 df = pd.read_csv("synthetic_profit.csv")
 table = df.astype(str).to_dict(orient="records")
-# 2) TAPEX table‐QA pipeline
 qa = pipeline(
     "table-question-answering",
-    model="microsoft/tapex-base-finetuned-wtq",
-    tokenizer="microsoft/tapex-base-finetuned-wtq",
-    device=-1
 )
-# 3) Few‐shot examples
-EXAMPLE_PROMPT = """
-Example 1:
-Q: What is the total revenue for Product A in EMEA in Q1 2024?
-A: Filter Product=A & Region=EMEA & FiscalYear=2024 & FiscalQuarter=Q1, then sum Revenue → 3075162.49
-Example 2:
-Q: What is the total cost for Product A in EMEA in Q1 2024?
-A: Filter Product=A & Region=EMEA & FiscalYear=2024 & FiscalQuarter=Q1, then sum Cost → 2894321.75
-Example 3:
-Q: What is the total margin for Product A in EMEA in Q1 2024?
-A: Filter Product=A & Region=EMEA & FiscalYear=2024 & FiscalQuarter=Q1, then sum ProfitMargin → 0.18
-"""
 def answer_question(question: str) -> str:
-    full_query = EXAMPLE_PROMPT + f"\nQ: {question}\nA:"
     try:
-        result = qa(table=table, query=full_query)
-        return result.get("answer", "No answer found.")
     except Exception as e:
-        # Return the actual exception message so you can debug
-        return f"❌ Pipeline error:\n{e}"
 # 4) Gradio UI
 iface = gr.Interface(
     fn=answer_question,
-    inputs=gr.Textbox(lines=2, placeholder="Ask a basic question…", label="Your question"),
-    outputs=gr.Textbox(lines=6, label="Answer"),
-    title="SAP Profitability Q&A",
-    description=(
-        "Ask simple revenue/cost/margin questions on the synthetic SAP data. "
-        "Powered by microsoft/tapex-base-finetuned-wtq with three few‐shot examples."
-    ),
     allow_flagging="never",
 )

+# app.py
 import gradio as gr
 import pandas as pd
 from transformers import pipeline
+# 1) Load your synthetic SAP data (all as strings so TAPAS never sees floats)
 df = pd.read_csv("synthetic_profit.csv")
 table = df.astype(str).to_dict(orient="records")
+# 2) Instantiate TAPAS fine-tuned on WikiTableQuestions
 qa = pipeline(
     "table-question-answering",
+    model="google/tapas-base-finetuned-wtq",
+    tokenizer="google/tapas-base-finetuned-wtq",
+    device=-1  # CPU; change to 0 if you enable GPU
 )
+# 3) Simple QA function
 def answer_question(question: str) -> str:
     try:
+        out = qa(table=table, query=question)
+        return out.get("answer", "No answer found.")
     except Exception as e:
+        return f"❌ Error: {e}"
 # 4) Gradio UI
 iface = gr.Interface(
     fn=answer_question,
+    inputs=gr.Textbox(lines=2, placeholder="e.g. What is the total revenue for Product A in EMEA in Q1 2024?"),
+    outputs=gr.Textbox(lines=4),
+    title="SAP Profitability Q&A (TAPAS)",
+    description="Ask simple sum/avg questions on your SAP data. Powered by google/tapas-base-finetuned-wtq.",
     allow_flagging="never",
 )