Spaces:

P2SAMAPA
/

P2-ETF-DQN-ENGINE

Running

App Files Files Community

P2-ETF-DQN-ENGINE / predict.py

P2SAMAPA

[auto] Deploy to HF Space from GitHub

c309d08 verified 1 day ago

raw

history blame contribute delete

9.27 kB

	# predict.py
	# Generates next-trading-day ETF signal from saved DQN weights.
	# Usage:
	# python predict.py --tsl 10 --z 1.1

	import argparse
	import json
	import os
	import shutil
	from datetime import datetime, date, timedelta, timezone

	import numpy as np
	import pandas as pd

	import config
	from data_download import load_local
	from features import build_features
	from agent import DQNAgent

	# Checkpoint file that run_predict() loads into the agent via agent.load().
	WEIGHTS_PATH = os.path.join(config.MODELS_DIR, "dqn_best.pt")
	# Optional training metadata; run_predict() reads "start_year", "trained_at"
	# and "lookback" from it when the file exists.
	SUMMARY_PATH = os.path.join(config.MODELS_DIR, "training_summary.json")
	# Output file for the latest prediction. The path is relative, so it resolves
	# against the process's current working directory.
	PRED_PATH = "latest_prediction.json"

	def next_trading_day(from_date=None) -> date:
	    """Return the first NYSE trading day strictly after ``from_date``.

	    The schedule is looked up through ``pandas_market_calendars`` so that
	    exchange holidays are respected without a hardcoded list. If that package
	    is missing or the lookup fails, the reason is printed and the function
	    falls back to skipping weekends only (holidays are NOT excluded then).

	    Args:
	        from_date: Reference date. When falsy, ``date.today()`` is used.

	    Returns:
	        The next trading date after the reference date.
	    """
	    # Resolve the reference date once so the calendar path and the fallback
	    # path agree even if the call straddles midnight.
	    start = from_date or date.today()
	    try:
	        import pandas_market_calendars as mcal

	        nyse = mcal.get_calendar("NYSE")
	        sched = nyse.schedule(
	            start_date=start.strftime("%Y-%m-%d"),
	            # A 14-day look-ahead window is searched for the next session.
	            end_date=(start + timedelta(days=14)).strftime("%Y-%m-%d"),
	        )
	        trading_dates = [d.date() for d in mcal.date_range(sched, frequency="1D")]
	        for session in trading_dates:
	            if session > start:
	                return session
	    except Exception as exc:
	        # Best-effort: keep going with the weekend-only rule, but say why the
	        # holiday-aware calendar was not used instead of hiding the failure.
	        print(f" NYSE calendar unavailable ({exc}); using weekend-only fallback")

	    # Fallback: weekend skip only
	    candidate = start + timedelta(days=1)
	    while candidate.weekday() >= 5:
	        candidate += timedelta(days=1)
	    return candidate


	def _q_zscore(q_vals: np.ndarray) -> np.ndarray:
	mu = q_vals.mean()
	std = q_vals.std() + 1e-9
	return (q_vals - mu) / std


	def download_from_hf():
	    """Fetch data parquet files and model artifacts from the HF dataset repo.

	    Each file is downloaded with ``hf_hub_download`` and copied into
	    ``config.DATA_DIR`` or ``config.MODELS_DIR``. Failures are reported per
	    file and never raised; a failure before the per-file stage (for example
	    the ``huggingface_hub`` import) is reported once for the whole call.
	    """
	    try:
	        from huggingface_hub import hf_hub_download

	        token = config.HF_TOKEN or None
	        for target_dir in (config.DATA_DIR, config.MODELS_DIR):
	            os.makedirs(target_dir, exist_ok=True)

	        def _fetch(remote_name, dest_dir, dest_name):
	            # Download into the hub cache, then copy to the project location.
	            cached = hf_hub_download(
	                repo_id=config.HF_DATASET_REPO,
	                filename=remote_name,
	                repo_type="dataset",
	                token=token,
	            )
	            shutil.copy(cached, os.path.join(dest_dir, dest_name))

	        # Data files: only failures are reported.
	        for stem in ("etf_prices", "macro"):
	            try:
	                _fetch(f"data/{stem}.parquet", config.DATA_DIR, f"{stem}.parquet")
	            except Exception as err:
	                print(f" data/{stem}: {err}")

	        # Model artifacts: success is reported as well.
	        for artifact in ("dqn_best.pt", "training_summary.json"):
	            try:
	                _fetch(f"models/{artifact}", config.MODELS_DIR, artifact)
	                print(f" ✓ models/{artifact}")
	            except Exception as err:
	                print(f" models/{artifact}: {err}")
	    except Exception as err:
	        print(f" HF download failed: {err}")


	def run_predict(tsl_pct: float = config.DEFAULT_TSL_PCT,
	                z_reentry: float = config.DEFAULT_Z_REENTRY) -> dict:
	    """Produce the next-session ETF signal from the saved DQN weights.

	    Loads local data and weights (pulling them from the HF dataset repo when
	    missing), builds the feature window, queries the agent for Q-values,
	    applies the trailing-stop-loss / re-entry rule, writes the result to
	    ``PRED_PATH`` as JSON and prints a summary.

	    Args:
	        tsl_pct: Stop-loss threshold in percent. The stop triggers when the
	            chosen ETF's return over the last three price rows is at or
	            below ``-tsl_pct``.
	        z_reentry: Minimum z-score the best action needs to stay invested
	            once the stop has triggered.

	    Returns:
	        The prediction dict that was written to ``PRED_PATH``, or ``{}`` when
	        data or weights could not be obtained.
	    """
	    print(f"\n{'='*60}")
	    print(f" Predict — {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}")
	    print(f"{'='*60}")

	    # ── Ensure data + weights ─────────────────────────────────────────────────
	    data = load_local()
	    if not data:
	        print(" No local data — downloading from HF...")
	        download_from_hf()
	        data = load_local()
	    if not data:
	        print(" ERROR: No data available.")
	        return {}

	    if not os.path.exists(WEIGHTS_PATH):
	        print(" No local weights — downloading from HF...")
	        download_from_hf()
	    if not os.path.exists(WEIGHTS_PATH):
	        print(" ERROR: No weights available.")
	        return {}

	    # ── Load training metadata ────────────────────────────────────────────────
	    trained_from_year = None
	    trained_at = None
	    lookback = config.LOOKBACK_WINDOW
	    if os.path.exists(SUMMARY_PATH):
	        with open(SUMMARY_PATH, encoding="utf-8") as f:
	            summary = json.load(f)
	        trained_from_year = summary.get("start_year")
	        trained_at = summary.get("trained_at")
	        # Use the lookback the model was trained with so state_size matches.
	        lookback = summary.get("lookback", config.LOOKBACK_WINDOW)

	    # ── Build features ────────────────────────────────────────────────────────
	    etf_prices = data["etf_prices"]
	    macro = data["macro"]
	    feat_df = build_features(etf_prices, macro)

	    # ── Load agent ────────────────────────────────────────────────────────────
	    # FIX: state_size must match env.py — flattened window + one-hot position (n_actions)
	    state_size = feat_df.shape[1] * lookback + config.N_ACTIONS
	    agent = DQNAgent(state_size=state_size)
	    agent.load(WEIGHTS_PATH)

	    # ── Build current state (last lookback rows) ──────────────────────────────
	    window = feat_df.iloc[-lookback:].values.astype(np.float32)
	    if len(window) < lookback:
	        # Not enough history: left-pad with zero rows up to the full window.
	        pad = np.zeros((lookback - len(window), feat_df.shape[1]), dtype=np.float32)
	        window = np.vstack([pad, window])
	    # FIX: append one-hot position — assume CASH at inference start (index 0)
	    position = np.zeros(config.N_ACTIONS, dtype=np.float32)
	    position[0] = 1.0  # CASH
	    state = np.concatenate([window.flatten(), position])

	    # ── Inference ─────────────────────────────────────────────────────────────
	    q_values = agent.q_values(state)
	    z_scores = _q_zscore(q_values)
	    best_idx = int(q_values.argmax())
	    best_z = float(z_scores[best_idx])

	    # T-bill rate: default 3.6 unless the feature frame carries a usable value.
	    tbill_rate = 3.6
	    if "macro_TBILL_3M" in feat_df.columns:
	        val = feat_df["macro_TBILL_3M"].iloc[-1]
	        if not np.isnan(val):
	            tbill_rate = float(val)

	    # TSL / re-entry check using last 2 days
	    tsl_triggered = False
	    in_cash = False
	    two_day_ret = 0.0
	    if best_idx != 0:  # index 0 is CASH; the stop only applies to an ETF pick
	        etf = config.ACTIONS[best_idx]
	        if etf in etf_prices.columns:
	            # Three price rows span two daily moves.
	            recent = etf_prices[etf].iloc[-3:]
	            two_day_ret = float((recent.iloc[-1] / recent.iloc[0]) - 1) * 100
	            if two_day_ret <= -tsl_pct:
	                tsl_triggered = True
	                # NOTE(review): the re-entry gate is applied only after a
	                # stop-loss trigger — nesting reconstructed from a source
	                # whose indentation was lost; confirm against the repo.
	                if best_z < z_reentry:
	                    in_cash = True

	    final_signal = "CASH" if in_cash else config.ACTIONS[best_idx]

	    # Signal date — use NYSE calendar
	    # New York wall-clock time with daylight saving applied; a fixed UTC-5
	    # offset shifts the 16:00 cutoff below by one hour during DST.
	    now_est = _now_new_york()
	    today = now_est.date()
	    try:
	        import pandas_market_calendars as mcal

	        nyse = mcal.get_calendar("NYSE")
	        sched = nyse.schedule(
	            start_date=today.strftime("%Y-%m-%d"),
	            end_date=today.strftime("%Y-%m-%d"),
	        )
	        is_trading_day = not sched.empty
	    except Exception:
	        # Calendar package unavailable: approximate with a weekday test.
	        is_trading_day = today.weekday() < 5
	    if is_trading_day and now_est.hour < 16:
	        signal_date = today
	    else:
	        signal_date = next_trading_day(today)

	    # Per-action probabilities (softmax of Q-values for display)
	    # Subtracting the max keeps exp() from overflowing; 0.1 is the temperature.
	    q_shifted = q_values - q_values.max()
	    exp_q = np.exp(q_shifted / 0.1)
	    probs = exp_q / exp_q.sum()
	    prob_dict = {config.ACTIONS[i]: round(float(probs[i]), 4)
	                 for i in range(config.N_ACTIONS)}

	    output = dict(
	        as_of_date=str(signal_date),
	        final_signal=final_signal,
	        final_confidence=round(float(probs[best_idx]), 4),
	        z_score=round(best_z, 3),
	        q_values={config.ACTIONS[i]: round(float(q_values[i]), 4)
	                  for i in range(config.N_ACTIONS)},
	        probabilities=prob_dict,
	        tbill_rate=round(tbill_rate, 3),
	        tsl_status=dict(
	            two_day_cumul_pct=round(two_day_ret, 2),
	            tsl_triggered=tsl_triggered,
	            in_cash=in_cash,
	            z_reentry=z_reentry,
	            tsl_pct=tsl_pct,
	        ),
	        trained_from_year=trained_from_year,
	        trained_at=trained_at,
	    )

	    with open(PRED_PATH, "w", encoding="utf-8") as f:
	        json.dump(output, f, indent=2, default=str)

	    print(f"\n Signal date : {signal_date}")
	    print(f" Final signal : {final_signal}")
	    print(f" Z-score : {best_z:.2f}σ")
	    print(f" Confidence : {float(probs[best_idx]):.1%}")
	    for act, p in prob_dict.items():
	        print(f" {act:<8} Q={q_values[config.ACTIONS.index(act)]:.3f} p={p:.3f}")
	    print(f"\n Saved → {PRED_PATH}")

	    return output


	def _now_new_york() -> datetime:
	    """Return the current New York wall-clock time as a naive datetime."""
	    try:
	        from zoneinfo import ZoneInfo

	        return datetime.now(ZoneInfo("America/New_York")).replace(tzinfo=None)
	    except (ImportError, KeyError):
	        # zoneinfo needs Python 3.9+ and an available tz database
	        # (ZoneInfoNotFoundError subclasses KeyError). Without it, fall back
	        # to a fixed UTC-5 offset, which is one hour off during DST.
	        return datetime.now(timezone.utc).replace(tzinfo=None) - timedelta(hours=5)


	if __name__ == "__main__":
	    # CLI entry point: both thresholds are optional floats defaulting to config.
	    cli = argparse.ArgumentParser()
	    for flag, fallback in (
	        ("--tsl", config.DEFAULT_TSL_PCT),
	        ("--z", config.DEFAULT_Z_REENTRY),
	    ):
	        cli.add_argument(flag, type=float, default=fallback)
	    opts = cli.parse_args()
	    run_predict(tsl_pct=opts.tsl, z_reentry=opts.z)