Spaces:
Sleeping
Sleeping
| # smc_multimodal_atr_report.py | |
| """ | |
| SMC Multimodal + Gemini Auto-label + Batch CSV Prediction with ATR-based SL/TP + HTML report. | |
| Requirements (example): | |
| pip install torch torchvision pandas scikit-learn pillow gradio tqdm joblib matplotlib google-generativeai | |
| Set GENAI_API_KEY environment variable for Gemini if using that tab. | |
| """ | |
import base64
import io
import json
import os
import shutil
import tempfile
import zipfile
from datetime import datetime, timezone
from typing import List, Optional, Tuple

import joblib
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from PIL import Image

import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import Dataset, DataLoader

from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

import gradio as gr
# --- Gemini client (google-genai) -----------------
# Optional dependency: only the Gemini auto-label path needs it, so a missing
# package degrades gracefully to genai=None instead of crashing the app.
try:
    from google import genai
except Exception:
    genai = None
# -------------------------
# Config
# -------------------------
DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")  # training/inference device
IMAGE_SIZE = 128  # chart images are resized to IMAGE_SIZE x IMAGE_SIZE pixels
SEQ_LEN = 32      # number of OHLCV rows per model input window
SEQ_BATCH = 64    # batch size used for sliding-window batch prediction
EPOCHS = 8        # default number of training epochs
MODEL_DIR = "models_smc_multimodal"  # checkpoints, scaler, trade CSVs, reports
AUTO_DIR = "auto_labeled"            # Gemini auto-labelled samples
os.makedirs(MODEL_DIR, exist_ok=True)
os.makedirs(AUTO_DIR, exist_ok=True)
# Class order matters: model logits index into this list (0=Sell, 1=Hold, 2=Buy).
LABELS = ["Sell", "Hold", "Buy"]
# -------------------------
# Helpers and CSV robustness
# -------------------------
# Accepted spellings for each canonical OHLCV column, checked in order by
# find_col(); the first match wins.
COMMON_COLS = {
    "open": ["open", "Open", "O", "o"],
    "high": ["high", "High", "H", "h"],
    "low": ["low", "Low", "L", "l"],
    "close":["close", "Close", "C", "c"],
    "volume":["volume", "Volume", "V", "v"]
}
def find_col(df, choices):
    """Return the first name in *choices* that is a column of *df*, else None."""
    return next((candidate for candidate in choices if candidate in df.columns), None)
def handle_ohlcv_csv(csv_file):
    """Load an OHLCV CSV and normalize it for downstream use.

    - Renames columns to canonical "Open"/"High"/"Low"/"Close"/"Volume"
      using the COMMON_COLS spelling table.
    - Parses and sorts by "Date" when that column exists.
    - Coerces the OHLCV columns to numeric and forward/back-fills gaps.

    Args:
        csv_file: object with a ``.name`` attribute pointing at the CSV
            (e.g. a Gradio file upload).

    Returns:
        A cleaned pandas DataFrame.

    Raises:
        ValueError: when a required column is missing or too many values
            remain NaN after filling.
    """
    df = pd.read_csv(csv_file.name)
    col_map = {}
    for key, choices in COMMON_COLS.items():
        found = find_col(df, choices)
        if not found:
            raise ValueError(f"OHLCV CSV missing column for '{key}'. Tried: {choices}")
        col_map[found] = key.capitalize()
    df = df.rename(columns=col_map)
    if "Date" in df.columns:
        try:
            # pandas >= 2.0 infers the format by default; the old
            # infer_datetime_format= keyword is deprecated/removed.
            df["Date"] = pd.to_datetime(df["Date"])
        except Exception:
            pass  # leave unparsed dates as-is; sorting still works lexically
        df = df.sort_values("Date").reset_index(drop=True)
    else:
        df = df.reset_index(drop=True)
    ohlcv_cols = ["Open", "High", "Low", "Close", "Volume"]
    for c in ohlcv_cols:
        df[c] = pd.to_numeric(df[c], errors="coerce")
    # fillna(method=...) is deprecated (removed in pandas 3.x); use the
    # dedicated ffill()/bfill() methods instead.
    df[ohlcv_cols] = df[ohlcv_cols].ffill().bfill()
    if df[ohlcv_cols].isnull().any().any():
        raise ValueError("OHLCV CSV contains too many missing values after fill.")
    return df
def label_to_index_generic(l):
    """Map a label to its index in LABELS.

    Accepts a case-insensitive label string ("Sell"/"Hold"/"Buy") or an
    int-convertible value in {0, 1, 2}.

    Raises:
        ValueError: when the value cannot be mapped.
    """
    if isinstance(l, str):
        s = l.strip().lower()
        for i, lab in enumerate(LABELS):
            if lab.lower() == s:
                return i
    # A bare except here would also swallow KeyboardInterrupt/SystemExit;
    # only the conversion failures are expected.
    try:
        idx = int(l)
    except (TypeError, ValueError):
        pass
    else:
        if idx in (0, 1, 2):
            return idx
    raise ValueError(f"Unknown label: {l}")
| # ------------------------- | |
| # Models (same as before) | |
| # ------------------------- | |
class MultimodalDataset(Dataset):
    """Dataset pairing a chart image with an OHLCV window and a class label.

    Each item is a tuple ``(img_path, seq_arr, label)``; ``__getitem__``
    loads the image from disk, resizes it to IMAGE_SIZE x IMAGE_SIZE,
    scales pixels to [0, 1] and returns CHW float32 tensors plus the label
    as a long tensor.
    """
    def __init__(self, items: List[Tuple[str, np.ndarray, int]]):
        self.items = items
    def __len__(self): return len(self.items)
    def __getitem__(self, idx):
        img_path, seq_arr, label = self.items[idx]
        # Image: force RGB, resize, normalize to [0, 1], then HWC -> CHW.
        img = Image.open(img_path).convert("RGB").resize((IMAGE_SIZE, IMAGE_SIZE))
        img_arr = (np.array(img).astype(np.float32) / 255.0)
        img_arr = np.transpose(img_arr, (2,0,1))
        img_tensor = torch.tensor(img_arr, dtype=torch.float32)
        seq_tensor = torch.tensor(seq_arr.astype(np.float32))
        label_tensor = torch.tensor(int(label), dtype=torch.long)
        return img_tensor, seq_tensor, label_tensor
class SimpleCNNEmbedding(nn.Module):
    """Three-stage conv stack mapping a 3xHxW image to an `emb_size` vector."""

    def __init__(self, emb_size=128):
        super().__init__()
        stages = []
        channels = [3, 16, 32, 64]
        for c_in, c_out in zip(channels[:-1], channels[1:]):
            stages += [nn.Conv2d(c_in, c_out, 3, padding=1), nn.ReLU(), nn.MaxPool2d(2)]
        self.conv = nn.Sequential(*stages)
        # Three 2x poolings shrink each spatial dimension by a factor of 8.
        flat_features = 64 * (IMAGE_SIZE // 8) * (IMAGE_SIZE // 8)
        self.head = nn.Sequential(nn.Flatten(), nn.Linear(flat_features, emb_size), nn.ReLU())

    def forward(self, x):
        return self.head(self.conv(x))
class SimpleLSTMEmbedding(nn.Module):
    """Bidirectional LSTM encoder: (B, T, n_features) -> (B, emb_size)."""

    def __init__(self, n_features, hidden=64, emb_size=128):
        super().__init__()
        self.lstm = nn.LSTM(
            input_size=n_features,
            hidden_size=hidden,
            num_layers=1,
            batch_first=True,
            bidirectional=True,
        )
        self.proj = nn.Sequential(nn.Linear(hidden * 2, emb_size), nn.ReLU())

    def forward(self, x):
        # Take the output at the final time step (both directions concatenated)
        # and project it down to the embedding size.
        outputs, _ = self.lstm(x)
        final_step = outputs[:, -1, :]
        return self.proj(final_step)
class MultimodalNet(nn.Module):
    """Two-branch classifier: CNN image embedding plus LSTM sequence embedding,
    concatenated and fed to an MLP head that produces n_classes logits."""
    def __init__(self, n_features, emb_size=128, n_classes=3):
        super().__init__()
        self.img_model = SimpleCNNEmbedding(emb_size=emb_size)
        self.seq_model = SimpleLSTMEmbedding(n_features=n_features, hidden=64, emb_size=emb_size)
        self.head = nn.Sequential(nn.Linear(emb_size*2, 256), nn.ReLU(), nn.Dropout(0.2), nn.Linear(256, n_classes))
    def forward(self, img, seq):
        img_emb = self.img_model(img)
        seq_emb = self.seq_model(seq)
        # Fuse the two modalities by simple concatenation along the feature dim.
        cat = torch.cat([img_emb, seq_emb], dim=1)
        return self.head(cat)
| # ------------------------- | |
| # Helper: ATR | |
| # ------------------------- | |
def compute_atr(df: pd.DataFrame, n=14):
    """Average True Range over *n* periods (simple rolling mean of TR).

    TR_t = max(High-Low, |High - prev Close|, |Low - prev Close|). For the
    first row the previous close is taken as that row's own close, so TR_0
    reduces to High-Low whenever Close lies inside [Low, High].

    Args:
        df: DataFrame with numeric "High", "Low", "Close" columns.
        n: ATR lookback window (default 14).

    Returns:
        numpy array of the same length as df (min_periods=1, so the head is
        a mean over the rows available so far rather than NaN).
    """
    high = df["High"].values
    low = df["Low"].values
    close = df["Close"].values
    # Previous close per row, computed once (the original built this array
    # twice inline); first element backfilled with the first close.
    prev_close = np.concatenate(([close[0]], close[:-1]))
    tr = np.maximum(high - low, np.maximum(np.abs(high - prev_close), np.abs(low - prev_close)))
    atr = pd.Series(tr).rolling(window=n, min_periods=1).mean().values
    return atr  # numpy array length n_rows
| # ------------------------- | |
| # Load & predict (single) | |
| # ------------------------- | |
def load_multimodal_model():
    """Load the trained MultimodalNet checkpoint from MODEL_DIR.

    Returns the model on DEVICE in eval mode, or None when no checkpoint
    file exists. The checkpoint dict is expected to contain "n_features"
    and "model_state".
    """
    path = os.path.join(MODEL_DIR, "multimodal_model.pt")
    if not os.path.exists(path):
        return None
    # NOTE(review): torch.load unpickles arbitrary objects — only load
    # checkpoints this app itself has written.
    ckpt = torch.load(path, map_location=DEVICE)
    n_features = ckpt.get("n_features")
    model = MultimodalNet(n_features=n_features, emb_size=128, n_classes=len(LABELS)).to(DEVICE)
    model.load_state_dict(ckpt["model_state"])
    model.eval()
    return model
def predict_multimodal(image_bytes, csv_snippet_file, scaler_path=os.path.join(MODEL_DIR,"csv_scaler.pkl")):
    """Classify one chart image plus an OHLCV snippet.

    Returns (label, {label: probability}) on success, or
    (error message string, None) when prerequisites are missing or the
    snippet is malformed.
    """
    model = load_multimodal_model()
    if model is None:
        return "No trained multimodal model found.", None
    if not os.path.exists(scaler_path):
        return "CSV scaler not found. Train first.", None

    # Image branch: RGB, resized, [0,1] floats, HWC -> CHW, plus batch dim.
    pil = Image.open(io.BytesIO(image_bytes)).convert("RGB").resize((IMAGE_SIZE, IMAGE_SIZE))
    pixels = np.transpose(np.array(pil).astype(np.float32) / 255.0, (2, 0, 1))
    img_tensor = torch.tensor(pixels[None], dtype=torch.float32).to(DEVICE)

    # Sequence branch: last SEQ_LEN rows of scaled OHLCV features.
    df = pd.read_csv(csv_snippet_file.name)
    if df.shape[0] < SEQ_LEN:
        return f"CSV snippet too short. Need at least {SEQ_LEN} rows.", None
    required = {"Open","High","Low","Close","Volume"}
    if not required.issubset(set(df.columns)):
        return f"CSV snippet must have columns: {required}", None
    scaler = joblib.load(scaler_path)
    raw = df[["Open","High","Low","Close","Volume"]].values.astype(np.float32)
    window = scaler.transform(raw)[-SEQ_LEN:]
    seq_tensor = torch.tensor(window[None], dtype=torch.float32).to(DEVICE)

    with torch.no_grad():
        probs = torch.softmax(model(img_tensor, seq_tensor), dim=-1).cpu().numpy()[0]
    best = int(probs.argmax())
    return LABELS[best], {LABELS[i]: float(probs[i]) for i in range(len(LABELS))}
| # ------------------------- | |
| # Batch predict with ATR-based SL/TP + HTML report | |
| # ------------------------- | |
def batch_predict_extract_trades_atr(full_csv_file, stop_mult=1.0, tp_mult=2.0, atr_period=14, max_hold=32, scaler_path=os.path.join(MODEL_DIR,"csv_scaler.pkl")):
    """
    Sliding-window sequence-only predictions and ATR-based stop/take management.

    Runs the trained model's sequence branch (the image embedding is zeroed)
    over every SEQ_LEN-long window of the OHLCV CSV, then simulates trades:
    enter on a Buy/Sell signal at the next candle's open; exit on an
    ATR-based stop/take level, an opposite signal, a max-hold timeout, or
    end of data.

    stop_mult: ATR multiplier for stop loss (e.g., 1.0)
    tp_mult: ATR multiplier for take profit (e.g., 2.0)
    atr_period: ATR period length (default 14)
    max_hold: maximum number of candles a position may be held
    scaler_path: fitted StandardScaler for the OHLCV feature columns

    Returns (trades_csv_path, plot_path, report_path, summary_text) on
    success, or (None, None, None, error_message) on failure.
    """
    # require scaler & model
    if not os.path.exists(scaler_path):
        return None, None, None, "CSV scaler not found. Train first."
    model = load_multimodal_model()
    if model is None:
        return None, None, None, "No trained multimodal model found."
    scaler = joblib.load(scaler_path)
    # load & clean df
    df = handle_ohlcv_csv(full_csv_file)
    n = df.shape[0]
    if n < SEQ_LEN:
        return None, None, None, f"CSV too short: need at least {SEQ_LEN} rows."
    feats = df[["Open","High","Low","Close","Volume"]].values.astype(np.float32)
    feats_scaled = scaler.transform(feats)
    # sliding windows (same as earlier): one window per candle, ending at end_idx
    windows = []
    indices = []  # NOTE(review): collected but never used below
    for end_idx in range(SEQ_LEN-1, n):
        start = end_idx - (SEQ_LEN-1)
        windows.append(feats_scaled[start:end_idx+1])
        indices.append(end_idx)
    X = np.stack(windows)  # (B, SEQ_LEN, features)
    # predict using sequence branch (zero image emb)
    device = DEVICE
    preds = []
    probs_all = []
    with torch.no_grad():
        B = X.shape[0]
        batch_size = SEQ_BATCH
        for i in range(0, B, batch_size):
            xb = torch.tensor(X[i:i+batch_size], dtype=torch.float32).to(device)
            seq_emb = model.seq_model(xb)  # (b, emb_size)
            # The classifier head expects [img_emb, seq_emb] concatenated;
            # feed zeros for the missing image branch.
            zero_img_emb = torch.zeros_like(seq_emb)
            head_in = torch.cat([zero_img_emb, seq_emb], dim=1)
            logits = model.head(head_in)
            probs = torch.softmax(logits, dim=-1).cpu().numpy()
            batch_preds = probs.argmax(axis=1)
            preds.extend(batch_preds.tolist())
            probs_all.extend(probs.tolist())
    # Align predictions with candle indices: the first SEQ_LEN-1 candles have
    # no complete window and therefore no label.
    label_series = [None] * (SEQ_LEN-1) + [LABELS[int(p)] for p in preds]
    prob_series = [None] * (SEQ_LEN-1) + [probs_all[i] for i in range(len(preds))]  # NOTE(review): unused
    # compute ATR
    atr = compute_atr(df, n=atr_period)  # numpy array
    trades = []
    state = "flat"  # NOTE(review): only ever "flat"; positions are handled inline below
    entry_idx = None
    entry_price = None
    side = None
    hold_count = 0
    t = SEQ_LEN-1  # first candle index that has a prediction
    while t < n:
        lab = label_series[t]
        # enter
        if state == "flat":
            if lab == "Buy" or lab == "Sell":
                # entry at next candle open if possible; fall back to this
                # candle's close when the signal lands on the last row
                entry_idx = t+1 if (t+1 < n) else t
                entry_open = float(df["Open"].iloc[entry_idx]) if (t+1 < n) else float(df["Close"].iloc[t])
                entry_price = entry_open
                side = "Long" if lab == "Buy" else "Short"
                # determine ATR at entry index (use most recent available)
                atr_val = float(atr[entry_idx]) if entry_idx < len(atr) else float(atr[-1])
                if np.isnan(atr_val) or atr_val == 0:
                    # fallback: use close-open; guard against a zero range
                    atr_val = float(abs(df["Close"].iloc[entry_idx] - df["Open"].iloc[entry_idx]))
                    if atr_val == 0:
                        atr_val = 1e-6
                # Stop/take levels mirror around the entry depending on side.
                if side == "Long":
                    stop_price = entry_price - stop_mult * atr_val
                    take_price = entry_price + tp_mult * atr_val
                else:
                    stop_price = entry_price + stop_mult * atr_val
                    take_price = entry_price - tp_mult * atr_val
                hold_count = 0
                # start scanning from entry candle (inclusive) for stop/take/opposite signal
                i = entry_idx
                exited = False
                while i < n:
                    # examine candle i high/low
                    high_i = float(df["High"].iloc[i])
                    low_i = float(df["Low"].iloc[i])
                    # check stop / take first (intra-candle); the stop is
                    # tested before the take, so a candle that touches both
                    # levels is counted as a stop (conservative assumption)
                    if side == "Long":
                        if low_i <= stop_price:
                            exit_price = stop_price
                            exit_idx = i
                            reason = "stop"
                            exited = True
                        elif high_i >= take_price:
                            exit_price = take_price
                            exit_idx = i
                            reason = "take"
                            exited = True
                    else:  # Short
                        if high_i >= stop_price:
                            exit_price = stop_price
                            exit_idx = i
                            reason = "stop"
                            exited = True
                        elif low_i <= take_price:
                            exit_price = take_price
                            exit_idx = i
                            reason = "take"
                            exited = True
                    if exited:
                        # record trade; pnl is the fractional return (shorts
                        # approximated as entry/exit - 1)
                        if side == "Long":
                            pnl = exit_price / entry_price - 1.0
                        else:
                            pnl = entry_price / exit_price - 1.0
                        trades.append({
                            "entry_idx": entry_idx,
                            "entry_time": df["Date"].iloc[entry_idx] if "Date" in df.columns else int(entry_idx),
                            "entry_price": entry_price,
                            "exit_idx": exit_idx,
                            "exit_time": df["Date"].iloc[exit_idx] if "Date" in df.columns else int(exit_idx),
                            "exit_price": exit_price,
                            "side": side,
                            "pnl": pnl,
                            "exit_reason": reason
                        })
                        state = "flat"
                        entry_idx = None; entry_price = None; side = None
                        # move t to exit_idx + 1
                        t = exit_idx + 1
                        break
                    # check opposite signal at this candle's aligned label (label_series aligned to window end)
                    lab_i = label_series[i] if i < len(label_series) else None
                    if (side == "Long" and lab_i == "Sell") or (side == "Short" and lab_i == "Buy"):
                        # exit at next open if exists
                        exit_idx = i+1 if (i+1 < n) else i
                        exit_price = float(df["Open"].iloc[exit_idx]) if (i+1 < n) else float(df["Close"].iloc[i])
                        reason = "opp_signal"
                        if side == "Long":
                            pnl = exit_price / entry_price - 1.0
                        else:
                            pnl = entry_price / exit_price - 1.0
                        trades.append({
                            "entry_idx": entry_idx,
                            "entry_time": df["Date"].iloc[entry_idx] if "Date" in df.columns else int(entry_idx),
                            "entry_price": entry_price,
                            "exit_idx": exit_idx,
                            "exit_time": df["Date"].iloc[exit_idx] if "Date" in df.columns else int(exit_idx),
                            "exit_price": exit_price,
                            "side": side,
                            "pnl": pnl,
                            "exit_reason": reason
                        })
                        state = "flat"
                        entry_idx = None; entry_price = None; side = None
                        t = exit_idx + 1
                        exited = True
                        break
                    # hold count: force an exit after max_hold candles
                    hold_count += 1
                    if hold_count >= max_hold:
                        exit_idx = i+1 if (i+1 < n) else i
                        exit_price = float(df["Open"].iloc[exit_idx]) if (i+1 < n) else float(df["Close"].iloc[i])
                        reason = "max_hold"
                        if side == "Long":
                            pnl = exit_price / entry_price - 1.0
                        else:
                            pnl = entry_price / exit_price - 1.0
                        trades.append({
                            "entry_idx": entry_idx,
                            "entry_time": df["Date"].iloc[entry_idx] if "Date" in df.columns else int(entry_idx),
                            "entry_price": entry_price,
                            "exit_idx": exit_idx,
                            "exit_time": df["Date"].iloc[exit_idx] if "Date" in df.columns else int(exit_idx),
                            "exit_price": exit_price,
                            "side": side,
                            "pnl": pnl,
                            "exit_reason": reason
                        })
                        state = "flat"
                        entry_idx = None; entry_price = None; side = None
                        t = exit_idx + 1
                        exited = True
                        break
                    # continue to next candle
                    i += 1
                if not exited:
                    # reached end of series without exit -> close at last close
                    exit_idx = n-1
                    exit_price = float(df["Close"].iloc[exit_idx])
                    reason = "eod"
                    if side == "Long":
                        pnl = exit_price / entry_price - 1.0
                    else:
                        pnl = entry_price / exit_price - 1.0
                    trades.append({
                        "entry_idx": entry_idx,
                        "entry_time": df["Date"].iloc[entry_idx] if "Date" in df.columns else int(entry_idx),
                        "entry_price": entry_price,
                        "exit_idx": exit_idx,
                        "exit_time": df["Date"].iloc[exit_idx] if "Date" in df.columns else int(exit_idx),
                        "exit_price": exit_price,
                        "side": side,
                        "pnl": pnl,
                        "exit_reason": reason
                    })
                    return _save_and_report(df, trades)  # end
                continue  # continue outer while (t already advanced to exit_idx+1)
        # increment t if no entry or after handled
        t += 1
    # done scanning
    return _save_and_report(df, trades)
def _save_and_report(df, trades):
    """Persist trades to CSV, plot entries/exits over the close price, compute
    summary statistics, and write an HTML report.

    Args:
        df: cleaned OHLCV DataFrame (used for the close-price plot).
        trades: list of trade dicts produced by the simulator.

    Returns:
        (trades_csv_path, plot_path, report_path, summary_text)
    """
    # save trades CSV
    trades_df = pd.DataFrame(trades)
    # Use an aware UTC datetime: naive datetime.utcnow().timestamp() is
    # interpreted as *local* time and yields a wrong epoch on non-UTC
    # machines (and utcnow() is deprecated since Python 3.12).
    ts = int(datetime.now(timezone.utc).timestamp())
    trades_csv_path = os.path.join(MODEL_DIR, f"trades_{ts}.csv")
    trades_df.to_csv(trades_csv_path, index=False)
    # make plot: close-price line plus one marker per trade entry/exit
    plt.figure(figsize=(12,5))
    plt.plot(df.index, df["Close"].values, label="Close")
    entries_x = []
    entries_y = []
    exits_x = []
    exits_y = []
    colors = []
    for tr in trades:
        eidx = int(tr["entry_idx"]); exidx = int(tr["exit_idx"])
        entries_x.append(eidx); entries_y.append(tr["entry_price"])
        exits_x.append(exidx); exits_y.append(tr["exit_price"])
        colors.append("g" if tr["side"]=="Long" else "r")
    # plot entries/exits (green = long, red = short)
    if len(entries_x):
        for (x,y,c) in zip(entries_x, entries_y, colors):
            plt.scatter([x],[y], marker="o", color=c, zorder=5)
    if len(exits_x):
        for (x,y,c) in zip(exits_x, exits_y, colors):
            plt.scatter([x],[y], marker="x", color=c, zorder=5)
    plt.title("Close price with entries (o) and exits (x)")
    plt.xlabel("index")
    plt.ylabel("Close")
    plt.legend()
    plot_path = os.path.join(MODEL_DIR, f"trades_plot_{ts}.png")
    plt.tight_layout()
    plt.savefig(plot_path)
    plt.close()
    # compute metrics
    if trades_df.empty:
        summary_text = "No trades generated."
        report_path = _generate_html_report(df, trades_df, plot_path, summary_text, {})
        return trades_csv_path, plot_path, report_path, summary_text
    pnl_list = trades_df["pnl"].astype(float).values
    total_pnl = float(np.nansum(pnl_list))
    avg_pnl = float(np.nanmean(pnl_list))
    wins = float((pnl_list > 0).sum())
    win_rate = float(wins / len(pnl_list)) if len(pnl_list) > 0 else 0.0
    # equity curve: compound (1 + pnl) per trade for multiplicative growth,
    # then measure drawdown against the running peak
    equity = np.cumprod(1 + pnl_list)  # start at 1
    peak = np.maximum.accumulate(equity)
    drawdowns = (peak - equity) / peak
    max_dd = float(np.max(drawdowns)) if len(drawdowns)>0 else 0.0
    summary = {
        "n_trades": int(len(pnl_list)),
        "total_pnl": total_pnl,
        "avg_pnl": avg_pnl,
        "win_rate": win_rate,
        "max_drawdown": max_dd
    }
    summary_text = f"Trades: {summary['n_trades']}, Total PnL (factorized): {summary['total_pnl']:.4f}, Win rate: {summary['win_rate']:.3f}, Max Drawdown: {summary['max_drawdown']:.3f}"
    report_path = _generate_html_report(df, trades_df, plot_path, summary_text, summary)
    return trades_csv_path, plot_path, report_path, summary_text
def _generate_html_report(df, trades_df, plot_path, summary_text, summary):
    """Render a self-contained HTML report and return its file path.

    The plot is embedded as base64 so the report is a single portable file;
    trades become an HTML table and *summary* a bullet list.
    """
    # embed plot as base64
    with open(plot_path, "rb") as f:
        img_b64 = base64.b64encode(f.read()).decode("ascii")
    img_tag = f'<img src="data:image/png;base64,{img_b64}" style="max-width:100%;height:auto;" />'
    # trades table html
    if trades_df.empty:
        trades_html = "<p>No trades</p>"
    else:
        trades_html = trades_df.to_html(classes="table table-striped", index=False, float_format="%.6f")
    # summary HTML block (join instead of repeated string concatenation)
    summary_items = "".join(f"<li><strong>{k}</strong>: {v}</li>" for k, v in summary.items())
    summary_html = "<ul>" + summary_items + "</ul>"
    # Aware UTC "now": datetime.utcnow() is deprecated and utcnow().timestamp()
    # gives a wrong epoch on non-UTC machines. The displayed timestamp keeps
    # the original naive ISO format.
    now_utc = datetime.now(timezone.utc)
    html = f"""
<html>
<head>
<meta charset="utf-8"/>
<title>SMC Multimodal - ATR Trades Report</title>
<style>
body {{ font-family: Arial, sans-serif; margin: 20px; }}
.header {{ margin-bottom: 20px; }}
.section {{ margin-bottom: 30px; }}
table {{ border-collapse: collapse; width: 100%; }}
table, th, td {{ border: 1px solid #ddd; }}
th, td {{ padding: 8px; text-align: left; }}
th {{ background-color: #f2f2f2; }}
</style>
</head>
<body>
<div class="header">
<h1>SMC Multimodal - ATR Trades Report</h1>
<p>Generated: {now_utc.replace(tzinfo=None).isoformat()} UTC</p>
<p>{summary_text}</p>
</div>
<div class="section">
<h2>Price chart with trades</h2>
{img_tag}
</div>
<div class="section">
<h2>Trades</h2>
{trades_html}
</div>
<div class="section">
<h2>Summary metrics</h2>
{summary_html}
</div>
</body>
</html>
"""
    ts = int(now_utc.timestamp())
    report_path = os.path.join(MODEL_DIR, f"report_{ts}.html")
    with open(report_path, "w", encoding="utf-8") as f:
        f.write(html)
    return report_path
| # ------------------------- | |
| # The rest (Gemini, auto-label, training) left mostly unchanged from earlier app | |
| # For brevity, reuse previous functions for ai_teacher and training wrappers. | |
| # (You can paste the previous implementation here for a full runnable app.) | |
| # ------------------------- | |
| # For this response I will implement minimal wrappers to keep the app runnable: | |
# Gemini API key: prefer GENAI_API_KEY, fall back to GOOGLE_API_KEY.
GENAI_API_KEY = os.environ.get("GENAI_API_KEY") or os.environ.get("GOOGLE_API_KEY")
# Instruction prompt sent to Gemini alongside the chart image. This was an
# f-string with zero placeholders, which forced `{{`/`}}` escaping for every
# literal brace; a plain string with single braces yields the same text.
PROMPT_JSON_SCHEMA = """
You are a chart-analysis assistant. INPUT: a candlestick chart image (standard candlestick, no overlays).
You MUST OUTPUT a single JSON object only (no explanatory text). Schema:
{
"label": "Buy" | "Sell" | "Hold",
"confidence": 0.0-1.0,
"seq_start": <integer index into the provided OHLCV CSV> OR a date string "YYYY-MM-DD" (one of the two),
"note": "brief explanation (optional)"
}
Constraints:
- Only output valid JSON following exactly the keys above.
- If uncertain, return confidence < 0.6.
- seq_start should be either an integer or an ISO date string (not both).
- Do NOT include any other keys.
"""
def ai_teacher_with_gemini(image_bytes: bytes, prompt_extra: str = "") -> dict:
    """Ask Gemini to label a candlestick chart image and return the parsed JSON.

    Args:
        image_bytes: raw PNG/JPEG bytes of the chart.
        prompt_extra: optional extra instructions appended to the schema prompt.

    Raises:
        RuntimeError: when the google-genai package or the API key is missing.
        ValueError: when no JSON object can be extracted from the response.
    """
    if genai is None:
        raise RuntimeError("google-genai package not installed. pip install google-generativeai")
    api_key = GENAI_API_KEY
    if not api_key:
        raise RuntimeError("Set GENAI_API_KEY environment variable with your Gemini API key.")
    client = genai.Client(api_key=api_key)
    prompt = PROMPT_JSON_SCHEMA + "\n" + prompt_extra
    pil_img = Image.open(io.BytesIO(image_bytes)).convert("RGB")
    contents = [prompt, pil_img]
    # google-genai's generate_content does not accept temperature /
    # max_output_tokens / response_format as direct keyword arguments —
    # generation settings must be passed via a GenerateContentConfig.
    from google.genai import types as genai_types
    response = client.models.generate_content(
        model="gemini-2.5-flash",
        contents=contents,
        config=genai_types.GenerateContentConfig(temperature=0.0, max_output_tokens=800),
    )
    # Extract the text parts of the first candidate; fall back to str(response)
    # if the response shape is unexpected.
    text = None
    try:
        cand = response.candidates[0]
        if hasattr(cand, "content") and hasattr(cand.content, "parts"):
            parts = cand.content.parts
            collected = []
            for p in parts:
                if getattr(p, "text", None):
                    collected.append(p.text)
            text = "\n".join(collected).strip()
        else:
            text = str(response)
    except Exception:
        text = str(response)
    # Parse strict JSON first; otherwise grab the outermost {...} span, since
    # models sometimes wrap JSON in prose or code fences.
    try:
        parsed = json.loads(text)
    except Exception:
        import re
        m = re.search(r"(\{.*\})", text, flags=re.S)
        if not m:
            raise ValueError(f"Could not parse JSON from model response: {text[:500]}")
        parsed = json.loads(m.group(1))
    return parsed
| # Minimal stubs for auto-label/train/predict wrappers so UI launches | |
# Directory and mapping CSV used by the (trimmed) auto-labelling workflow.
AUTO_IMAGES_DIR = os.path.join(AUTO_DIR, "images")
os.makedirs(AUTO_IMAGES_DIR, exist_ok=True)
AUTO_MAPPING_CSV = os.path.join(AUTO_DIR, "mapping_auto.csv")
# Seed an empty mapping file on first run so later appends can assume it exists.
if not os.path.exists(AUTO_MAPPING_CSV):
    pd.DataFrame(columns=["filename","label","seq_start"]).to_csv(AUTO_MAPPING_CSV, index=False)
def ui_ai_label_and_suggest(img_filepath, ohlcv_csv=None):
    """Placeholder AI-labelling callback; echoes the image path back unchanged."""
    status = "AI tab not active in this trimmed example (install GenAI)"
    return status, "{}", None, img_filepath
def ui_accept_auto_label(img_filepath, parsed_json_text, seq_start_override, save_prefix="auto"):
    """Placeholder: accepting auto-labels is disabled in this trimmed build."""
    status = "Not implemented in trimmed example"
    return status, None
def ui_train_from_auto(ohlcv_csv, epochs=EPOCHS):
    """Placeholder: training from auto-labelled data is disabled in this trimmed build."""
    status = "Train-from-auto not implemented in trimmed example"
    return status, None
def ui_train_multimodal_wrapper(img_zip_file, mapping_file, ohlcv_file_in, epochs_in):
    """Placeholder: multimodal training is disabled in this trimmed build."""
    status = "Train wrapper not implemented in trimmed example"
    return status, None
def ui_predict_multimodal(img_filepath, csv_snippet_file):
    """Gradio callback: read the chart image from disk and run prediction.

    Returns (label_or_error, probs_string_or_None, image_path_or_None).
    """
    try:
        with open(img_filepath, "rb") as fh:
            raw = fh.read()
    except Exception as exc:
        return f"Could not read image file: {exc}", None, None
    try:
        label, probs = predict_multimodal(raw, csv_snippet_file)
    except Exception as exc:
        return f"Prediction error: {exc}", None, None
    return label, str(probs), img_filepath
def ui_batch_predict_and_export(full_csv_file, stop_mult, tp_mult, atr_period, max_hold):
    """Gradio callback wrapping batch_predict_extract_trades_atr; never raises."""
    try:
        trades_csv, plot_path, report_path, msg = batch_predict_extract_trades_atr(
            full_csv_file,
            stop_mult=float(stop_mult),
            tp_mult=float(tp_mult),
            atr_period=int(atr_period),
            max_hold=int(max_hold),
        )
    except Exception as exc:
        return f"Batch predict error: {exc}", None, None, None
    if trades_csv is None:
        # The simulator signalled an error in *msg* (missing model/scaler etc.)
        return msg, None, None, None
    return msg, trades_csv, plot_path, report_path
| # ------------------------- | |
| # Build Gradio UI | |
| # ------------------------- | |
# Gradio UI: a single batch-prediction tab plus a static notes tab.
with gr.Blocks() as demo:
    gr.Markdown("# SMC Multimodal Trainer + ATR-based Trade Extraction & HTML Report")
    with gr.Tab("Query / Batch Predict (ATR)"):
        gr.Markdown("Upload a full OHLCV CSV and choose ATR/SL/TP settings to generate trades and an HTML report.")
        full_csv = gr.File(label="Full OHLCV CSV (for batch prediction)")
        with gr.Row():
            stop_mult_input = gr.Number(value=1.0, label="Stop ATR multiplier (stop = entry ± ATR * stop_mult)")
            tp_mult_input = gr.Number(value=2.0, label="TakeProfit ATR multiplier (take = entry ± ATR * tp_mult)")
            atr_period_input = gr.Number(value=14, label="ATR period")
            max_hold_input = gr.Number(value=32, label="Max holding candles")
        batch_btn = gr.Button("Batch Predict -> ATR trades + report")
        batch_out = gr.Textbox(label="Batch Output")
        batch_trades_file = gr.File(label="Trades CSV (download)")
        batch_plot = gr.Image(label="Trades plot (entries/exits)")
        batch_report = gr.File(label="HTML report (download)")
        # Wire the button to the batch callback: inputs map positionally to
        # ui_batch_predict_and_export's parameters, outputs to its 4-tuple.
        batch_btn.click(fn=ui_batch_predict_and_export, inputs=[full_csv, stop_mult_input, tp_mult_input, atr_period_input, max_hold_input], outputs=[batch_out, batch_trades_file, batch_plot, batch_report])
    with gr.Tab("Notes"):
        gr.Markdown("""
**ATR-based trade simulation notes**
- This simulator uses ATR for stop loss and take profit levels.
- Entry is at next candle Open after the signal.
- The simulator checks each candle to see if SL/TP hit (intra-candle).
- If the opposite model signal appears, it exits at the next open.
- HTML report includes embedded plot and trade table, plus summary metrics (win rate, max drawdown).
- Validate the results and tune multipliers (stop_mult / tp_mult) before trusting strategies.
""")
if __name__ == "__main__":
    demo.launch(debug=True, share=False)