Money-Manager / app.py
spacedout-bits's picture
Add Personal Finance Manager with HF Hub CSV storage
af365fe
import gradio as gr
import pandas as pd
import json
from datetime import datetime
from typing import Tuple, Dict, Any
import os
import logging
try:
from langchain.llms import HuggingFaceHub
from langchain.prompts import PromptTemplate
from langchain.chains import LLMChain
except ImportError:
# Fallback: try OpenAI or basic mock
pass
from hf_storage import HFHubLedger
# Setup logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
class ExpenseManager:
"""Manages ledger entries and DataFrame operations."""
def __init__(self):
"""Initialize the expense manager with an empty DataFrame."""
self.df = pd.DataFrame(
columns=["Date", "Description", "Category", "Amount"]
)
self.df["Date"] = pd.to_datetime(self.df["Date"])
self.df["Amount"] = pd.to_numeric(self.df["Amount"])
def add_entry(self, date: str, description: str, category: str, amount: float) -> bool:
"""Add a new expense entry to the ledger."""
try:
new_entry = pd.DataFrame({
"Date": [pd.to_datetime(date)],
"Description": [description],
"Category": [category],
"Amount": [float(amount)]
})
self.df = pd.concat([self.df, new_entry], ignore_index=True)
self.df = self.df.sort_values("Date", ascending=False).reset_index(drop=True)
return True
except Exception as e:
print(f"Error adding entry: {e}")
return False
def get_dataframe(self) -> pd.DataFrame:
"""Return the current DataFrame."""
return self.df.copy()
def get_total_spending(self) -> float:
"""Calculate and return total spending."""
if self.df.empty:
return 0.0
return self.df["Amount"].sum()
def get_category_summary(self) -> Dict[str, float]:
"""Get spending summary by category."""
if self.df.empty:
return {}
return self.df.groupby("Category")["Amount"].sum().to_dict()
def initialize_llm():
"""Initialize the LLM. Supports HuggingFace or OpenAI."""
try:
# Try HuggingFace
api_token = os.getenv("HUGGINGFACEHUB_API_TOKEN")
if api_token:
llm = HuggingFaceHub(
repo_id="mistralai/Mistral-7B-Instruct-v0.2",
huggingfacehub_api_token=api_token,
model_kwargs={"temperature": 0.1, "max_length": 200}
)
return llm
except Exception as e:
print(f"HuggingFace initialization failed: {e}")
try:
# Fallback to OpenAI
from langchain.llms import OpenAI
api_key = os.getenv("OPENAI_API_KEY")
if api_key:
return OpenAI(temperature=0.1, max_tokens=200)
except Exception as e:
print(f"OpenAI initialization failed: {e}")
return None
def parse_expense_with_llm(user_input: str, llm) -> Dict[str, Any]:
"""
Parse natural language input into structured expense data using LLM.
Returns a dictionary with keys: date, description, category, amount
"""
if not llm:
return parse_expense_fallback(user_input)
prompt_template = PromptTemplate(
input_variables=["user_input"],
template="""Parse the following expense entry and extract the information into a JSON object.
User input: {user_input}
Return ONLY a valid JSON object with these fields (use today's date if not specified):
- date (YYYY-MM-DD format)
- description (what was purchased)
- category (e.g., Food, Transportation, Utilities, Entertainment, Other)
- amount (numeric value without currency symbol)
JSON:"""
)
chain = LLMChain(llm=llm, prompt=prompt_template)
response = chain.run(user_input=user_input)
try:
# Extract JSON from response
json_str = response.strip()
# Find JSON object in response
start_idx = json_str.find("{")
end_idx = json_str.rfind("}") + 1
if start_idx != -1 and end_idx > start_idx:
json_str = json_str[start_idx:end_idx]
parsed = json.loads(json_str)
return parsed
except json.JSONDecodeError as e:
print(f"JSON parsing error: {e}")
return parse_expense_fallback(user_input)
def parse_expense_fallback(user_input: str) -> Dict[str, Any]:
"""
Fallback parser using regex and heuristics when LLM is unavailable.
"""
import re
result = {
"date": datetime.now().strftime("%Y-%m-%d"),
"description": user_input,
"category": "Other",
"amount": 0.0
}
# Try to extract amount
amount_pattern = r"\$?(\d+(?:\.\d{2})?)"
amount_match = re.search(amount_pattern, user_input)
if amount_match:
result["amount"] = float(amount_match.group(1))
# Simple category detection
categories = {
"Food": ["food", "lunch", "dinner", "breakfast", "coffee", "restaurant", "burrito", "pizza", "eat"],
"Transportation": ["gas", "uber", "lyft", "taxi", "bus", "train", "parking", "car"],
"Utilities": ["electric", "water", "gas", "internet", "phone", "utility"],
"Entertainment": ["movie", "concert", "game", "book", "music"],
"Rent": ["rent", "apartment", "mortgage"],
}
user_lower = user_input.lower()
for category, keywords in categories.items():
if any(keyword in user_lower for keyword in keywords):
result["category"] = category
break
return result
def process_expense_entry(
user_input: str,
manager: ExpenseManager,
llm,
hf_ledger: HFHubLedger = None
) -> Tuple[pd.DataFrame, str, str]:
"""
Process user input, parse it, add to ledger, and return updated table.
"""
if not user_input.strip():
return manager.get_dataframe(), "", "Please enter an expense description."
try:
# Parse the expense
parsed = parse_expense_with_llm(user_input, llm)
# Validate parsed data
if not parsed.get("amount") or parsed["amount"] <= 0:
return manager.get_dataframe(), "", "โŒ Error: Could not extract valid amount. Try again."
# Add to ledger
success = manager.add_entry(
date=parsed.get("date", datetime.now().strftime("%Y-%m-%d")),
description=parsed.get("description", user_input),
category=parsed.get("category", "Other"),
amount=float(parsed["amount"])
)
if success:
# Sync to HF Hub if enabled
if hf_ledger:
hf_ledger.save(manager.df)
total = manager.get_total_spending()
message = f"โœ… Logged: ${parsed['amount']:.2f} - {parsed['description']}"
return manager.get_dataframe(), "", message
else:
return manager.get_dataframe(), "", "โŒ Error adding entry. Please try again."
except Exception as e:
return manager.get_dataframe(), "", f"โŒ Error: {str(e)}"
def build_interface(manager, llm, hf_ledger: HFHubLedger):
"""Build the Gradio interface."""
def log_expense_callback(user_input: str) -> Tuple[pd.DataFrame, str, str]:
"""Callback for log expense button."""
df, cleared_input, message = process_expense_entry(user_input, manager, llm, hf_ledger)
total = manager.get_total_spending()
total_md = f"### ๐Ÿ’ฐ Total Spending: ${total:.2f}"
return df, cleared_input, message, total_md
with gr.Blocks(theme=gr.themes.Soft()) as demo:
gr.Markdown("# ๐Ÿ’ธ Personal Finance Manager")
gr.Markdown("Log your expenses using natural language. The AI will parse and categorize them for you.")
gr.Markdown(f"**Storage Status:** {hf_ledger.get_status()}")
with gr.Row():
with gr.Column(scale=3):
user_input = gr.Textbox(
label="Describe your expense",
placeholder="e.g., 'Spent $15 on a burrito at Chipotle' or 'Paid $1200 for rent'",
lines=2
)
with gr.Column(scale=1):
log_button = gr.Button("Log Expense", variant="primary", scale=1)
status_output = gr.Textbox(
label="Status",
interactive=False,
max_lines=1
)
total_display = gr.Markdown("### ๐Ÿ’ฐ Total Spending: $0.00")
gr.Markdown("## ๐Ÿ“Š Ledger")
ledger_table = gr.Dataframe(
value=manager.get_dataframe(),
interactive=False,
label="Expense Entries",
datatype=["str", "str", "str", "number"],
)
# Connect button click to callback
log_button.click(
fn=log_expense_callback,
inputs=[user_input],
outputs=[ledger_table, user_input, status_output, total_display]
)
# Allow Enter key to submit
user_input.submit(
fn=log_expense_callback,
inputs=[user_input],
outputs=[ledger_table, user_input, status_output, total_display]
)
return demo
def main():
"""Main entry point."""
# Initialize HuggingFace Hub ledger
hf_ledger = HFHubLedger()
# Initialize components
manager = ExpenseManager()
# Load existing data from HF Hub if available
if hf_ledger.df is not None and not hf_ledger.df.empty:
manager.df = hf_ledger.df.copy()
logger.info(f"Loaded {len(manager.df)} entries from persistent storage")
llm = initialize_llm()
if not llm:
logger.warning("โš ๏ธ Warning: LLM not available. Using fallback parser.")
# Build and launch interface
demo = build_interface(manager, llm, hf_ledger)
demo.launch(share=False)
if __name__ == "__main__":
main()