Spaces:

Sbboss
/

FinAIAgent

Sleeping

App Files Files Community

FinAIAgent / agent /utils.py

Sbboss

Initial commit

4a86b49 5 months ago

raw

history blame contribute delete

8.31 kB

	import pandas as pd
	import numpy as np
	import matplotlib.pyplot as plt

	# Load and prepare data
	# Read every worksheet of the workbook; `sheet_name=None` yields a dict
	# of DataFrames keyed by sheet name.
	dfs = pd.read_excel("data.xlsx", sheet_name=None)

	# Take independent copies of the four sheets this module works with, so
	# the column rewrite below does not touch the frames held in `dfs`.
	actuals, budget, cash, fx = (
	    dfs[sheet].copy() for sheet in ("actuals", "budget", "cash", "fx")
	)

	# Store `month` as a monthly pandas Period in every table so the tables
	# can be compared and joined on it.
	for df in (actuals, budget, cash, fx):
	    df["month"] = pd.to_datetime(df["month"]).dt.to_period("M")

	# Helper: convert any DataFrame with `amount` & `currency` to USD
	def convert_to_usd(df: pd.DataFrame, fx: pd.DataFrame) -> pd.DataFrame:
	    """Return ``df`` left-joined to ``fx`` with an added ``amount_usd`` column.

	    The join keys are ``month`` and ``currency``. Rows with no matching
	    rate get ``rate_to_usd`` = 1.0, and ``amount_usd`` is
	    ``amount * rate_to_usd``. Columns of ``fx`` whose names clash with
	    columns of ``df`` receive the ``_fx`` suffix. ``df`` is not modified.
	    """
	    with_rates = pd.merge(
	        df,
	        fx,
	        how="left",
	        on=["month", "currency"],
	        suffixes=("", "_fx"),
	    )
	    # Unmatched rows fall back to a rate of 1.0.
	    rates = with_rates["rate_to_usd"].fillna(1.0)
	    with_rates["rate_to_usd"] = rates
	    with_rates["amount_usd"] = with_rates["amount"] * rates
	    return with_rates

	# 1. Revenue variance
	def revenue_variance(start_month: str, end_month: str) -> tuple[float, float, float]:
	    """Compare actual and budgeted revenue, in USD, over a range of months.

	    The module-level ``actuals`` and ``budget`` tables are each converted
	    with ``convert_to_usd`` and reduced to the rows whose
	    ``account_category`` is ``"Revenue"`` and whose ``month`` lies between
	    the two bounds, inclusive.

	    Parameters
	    ----------
	    start_month, end_month : str
	        Bounds of the range; each is parsed with ``pd.Period``.

	    Returns
	    -------
	    tuple
	        ``(variance, actual_revenue, budget_revenue)`` where
	        ``variance = actual_revenue - budget_revenue``.
	    """
	    # Parse the bounds once; they are shared by both tables.
	    first, last = pd.Period(start_month), pd.Period(end_month)

	    def revenue_total(table: pd.DataFrame) -> float:
	        # Sum the USD revenue rows of `table` inside the requested range.
	        usd = convert_to_usd(table, fx)
	        selected = (
	            (usd["month"] >= first)
	            & (usd["month"] <= last)
	            & (usd["account_category"] == "Revenue")
	        )
	        return usd.loc[selected, "amount_usd"].sum()

	    actual_rev = revenue_total(actuals)
	    budget_rev = revenue_total(budget)
	    return actual_rev - budget_rev, actual_rev, budget_rev

	# 2. Gross Margin %
	def gross_margin_pct(start_month: str, end_month: str) -> dict[str, float]:
	    """Compute the gross margin percentage for each month in a range.

	    The module-level ``actuals`` table is converted with
	    ``convert_to_usd``. For every month present in the data between the
	    two bounds (inclusive), the margin is
	    ``(Revenue - COGS) / Revenue * 100`` using the ``amount_usd`` totals
	    of those two account categories.

	    Parameters
	    ----------
	    start_month, end_month : str
	        Bounds of the range; each is parsed with ``pd.Period``.

	    Returns
	    -------
	    dict
	        Maps ``str(month)`` to the margin rounded to two decimals, in
	        ascending month order. A month with zero revenue maps to ``0.0``.
	    """
	    a = convert_to_usd(actuals, fx)
	    # Restrict to the requested window once instead of re-filtering the
	    # whole table for every month.
	    in_range = a[(a["month"] >= pd.Period(start_month)) & (a["month"] <= pd.Period(end_month))]

	    result = {}
	    for m in sorted(in_range["month"].unique()):
	        sub = in_range[in_range["month"] == m]
	        rev = sub.loc[sub["account_category"] == "Revenue", "amount_usd"].sum()
	        cogs = sub.loc[sub["account_category"] == "COGS", "amount_usd"].sum()
	        # Guard the division: a month without revenue reports 0.0.
	        result[str(m)] = round((rev - cogs) / rev * 100, 2) if rev != 0 else 0.0

	    return result

	# 3. Opex breakdown
	def opex_breakdown(start_month: str, end_month: str) -> dict:
	    """Total the USD actuals of each Opex category over a range of months.

	    The module-level ``actuals`` table is converted with
	    ``convert_to_usd``; rows are kept when ``month`` lies between the two
	    bounds (inclusive) and ``account_category`` starts with ``"Opex"``.
	    Returns a dict mapping each such category to its summed ``amount_usd``.
	    """
	    usd_actuals = convert_to_usd(actuals, fx)
	    months = usd_actuals["month"]
	    not_too_early = months >= pd.Period(start_month)
	    not_too_late = months <= pd.Period(end_month)
	    is_opex = usd_actuals["account_category"].str.startswith("Opex")

	    opex_rows = usd_actuals[not_too_early & not_too_late & is_opex]
	    per_category = opex_rows.groupby("account_category")["amount_usd"].sum()
	    return per_category.to_dict()

	# 4. EBITDA proxy
	def ebitda_proxy(start_month: str, end_month: str) -> float:
	    """Return Revenue minus COGS minus Opex, in USD, over a range of months.

	    The module-level ``actuals`` table is converted with
	    ``convert_to_usd`` and restricted to months between the two bounds
	    (inclusive). Opex is every ``account_category`` starting with
	    ``"Opex"``.
	    """
	    usd_actuals = convert_to_usd(actuals, fx)
	    months = usd_actuals["month"]
	    in_window = (months >= pd.Period(start_month)) & (months <= pd.Period(end_month))
	    categories = usd_actuals["account_category"]
	    usd_amounts = usd_actuals["amount_usd"]

	    revenue = usd_amounts[in_window & (categories == "Revenue")].sum()
	    cost_of_goods = usd_amounts[in_window & (categories == "COGS")].sum()
	    operating = usd_amounts[in_window & categories.str.startswith("Opex")].sum()
	    return revenue - cost_of_goods - operating

	# 5. Cash runway
	def cash_runway(as_of_month: str | None = None, last_n_months: int = 3) -> tuple[float, float]:
	    """Estimate how many months of cash remain at the recent average burn.

	    Parameters
	    ----------
	    as_of_month : str, optional
	        Month whose cash balance is used, parsed with ``pd.Period``.
	        When omitted, the latest month in the module-level ``cash`` table
	        is used.
	    last_n_months : int
	        Number of months strictly before the as-of month to average the
	        burn over. Fewer are used when the data holds fewer. Must be at
	        least 1.

	    Returns
	    -------
	    tuple
	        ``(runway_months, avg_burn)``. Monthly burn is
	        ``COGS + Opex - Revenue`` in USD. ``runway_months`` is
	        ``cash / avg_burn``, or ``float('inf')`` when the average burn is
	        not positive (including when no earlier months exist).

	    Raises
	    ------
	    ValueError
	        If ``last_n_months`` is less than 1.
	    """
	    # A window of 0 would slice `[-0:]`, i.e. silently average over the
	    # entire history; reject non-positive windows explicitly.
	    if last_n_months < 1:
	        raise ValueError(f"last_n_months must be a positive integer, got {last_n_months}")

	    # If no as_of_month is specified, use the most recent month on record.
	    most_recent = cash["month"].max() if as_of_month is None else pd.Period(as_of_month)

	    # Cash balance as of the specified/most recent month.
	    cash_usd = cash.loc[cash["month"] == most_recent, "cash_usd"].sum()

	    a = convert_to_usd(actuals, fx)
	    category = a["account_category"]
	    # na=False keeps rows with a missing category out of Opex instead of
	    # producing a mask that cannot be used for indexing.
	    is_opex = category.str.startswith("Opex", na=False)

	    # Months strictly before the as-of month; the slice already copes with
	    # having fewer than `last_n_months` of them.
	    earlier_months = sorted(m for m in a["month"].unique() if m < most_recent)
	    months = earlier_months[-last_n_months:]

	    burns = []
	    for m in months:
	        in_month = a["month"] == m
	        rev = a.loc[in_month & (category == "Revenue"), "amount_usd"].sum()
	        cogs = a.loc[in_month & (category == "COGS"), "amount_usd"].sum()
	        opex = a.loc[in_month & is_opex, "amount_usd"].sum()
	        burns.append(cogs + opex - rev)

	    avg_burn = sum(burns) / len(burns) if burns else 0
	    runway = cash_usd / avg_burn if avg_burn > 0 else float('inf')
	    return runway, avg_burn

	def plot_chart(
	    chart_type: str,
	    x,
	    y,
	    title: str,
	    x_label: str,
	    y_label: str,
	    output_path: str,
	    legends: list[str] | None = None,
	) -> str:
	    """
	    Plot helper that supports single-series bar, line, scatter and pie
	    charts and multi-series bar, line and scatter charts. The figure is
	    saved to ``output_path``.

	    Parameters
	    ----------
	    chart_type : {"bar", "line", "scatter", "pie"}
	    x, y : list-like objects. For multi-series data,
	        use y = [[series1], [series2], …] and
	        x = [[categories]] (a flat list of categories is also accepted).
	    title : Chart title.
	    x_label, y_label : Axis labels; not applied to pie charts.
	    output_path : File the figure is written to.
	    legends : Optional list of legend labels, one per series. In
	        multi-series charts a missing label defaults to "Series <n>".

	    Returns
	    -------
	    str
	        ``output_path`` on success. If anything fails (including an empty
	        ``y`` or an unsupported ``chart_type``), no exception is raised;
	        an error message containing the exception text is returned.
	    """
	    def series_label(index: int) -> str:
	        # Legend text for one series of a multi-series chart.
	        if legends and index < len(legends):
	            return legends[index]
	        return f"Series {index + 1}"

	    fig = None
	    try:
	        if len(y) == 0:
	            raise ValueError("y is empty; nothing to plot")

	        fig = plt.figure(figsize=(7, 4))

	        # ── MULTI-SERIES ────────────────────────────────────────────────
	        if isinstance(y[0], list) and len(y) > 1:
	            # Shared x-axis; tolerate a flat list as well as [[categories]].
	            categories = x[0] if isinstance(x[0], list) else x
	            n_groups = len(categories)
	            n_series = len(y)

	            if chart_type == "bar":
	                bar_width = 0.8 / n_series
	                x_pos = np.arange(n_groups)
	                colors = ['#1f77b4', '#ff7f0e', '#2ca02c',
	                          '#d62728', '#9467bd']

	                for i, series in enumerate(y):
	                    # Centre the group of bars on each tick position.
	                    offset = (i - n_series / 2 + 0.5) * bar_width
	                    plt.bar(
	                        x_pos + offset,
	                        series,
	                        bar_width,
	                        color=colors[i % len(colors)],
	                        label=series_label(i),
	                    )

	                plt.xticks(x_pos, categories, rotation=45)
	                plt.legend()

	            elif chart_type == "line":
	                for i, series in enumerate(y):
	                    plt.plot(categories, series, marker="o", label=series_label(i))
	                plt.legend()
	                plt.xticks(rotation=45)

	            elif chart_type == "scatter":
	                for i, series in enumerate(y):
	                    plt.scatter(categories, series, s=60, alpha=0.7,
	                                label=series_label(i))
	                plt.legend()

	            else:
	                # Previously fell through and saved an empty chart.
	                raise ValueError(
	                    f"Unsupported chart_type {chart_type!r} for multi-series "
	                    "data; expected 'bar', 'line' or 'scatter'"
	                )

	        # ── SINGLE-SERIES ───────────────────────────────────────────────
	        else:
	            # Flatten if wrapped.
	            if isinstance(y[0], list):
	                y = y[0]
	            if isinstance(x[0], list):
	                x = x[0]

	            label = legends[0] if legends else None

	            if chart_type == "line":
	                plt.plot(x, y, marker="o", linewidth=2, markersize=6, label=label)
	            elif chart_type == "bar":
	                plt.bar(x, y, color="skyblue", edgecolor="navy", alpha=0.7,
	                        label=label)
	                plt.xticks(rotation=45)
	                plt.ylim(bottom=0)
	            elif chart_type == "scatter":
	                plt.scatter(x, y, s=60, alpha=0.7, label=label)
	            elif chart_type == "pie":
	                plt.pie(y, labels=x, autopct="%1.1f%%", startangle=90)
	                plt.axis("equal")
	            else:
	                # Previously fell through and saved an empty chart.
	                raise ValueError(
	                    f"Unsupported chart_type {chart_type!r}; expected "
	                    "'bar', 'line', 'scatter' or 'pie'"
	                )

	            if legends and chart_type != "pie":
	                plt.legend()

	        # ── COMMON FORMATTING ──────────────────────────────────────────
	        plt.title(title, fontsize=14, fontweight="bold")

	        if chart_type != "pie":
	            plt.xlabel(x_label, fontsize=12)
	            plt.ylabel(y_label, fontsize=12)
	            plt.grid(True, alpha=0.3)

	        plt.tight_layout()
	        plt.savefig(output_path, dpi=100, bbox_inches="tight")
	        return output_path

	    except Exception as e:
	        # Deliberate best-effort: the failure is reported as text to the
	        # caller rather than raised.
	        return f'There is some problem with the data you send, I am using matplotlib to plot. Can you send a full code to other tool which could run on PythonREPLTool (should save the graph and return the filename). Here is the error: {e}'
	    finally:
	        # Close the figure on every path so failed plots do not accumulate.
	        if fig is not None:
	            plt.close(fig)