Spaces:

P2SAMAPA
/

P2-ETF-DQN-ENGINE

Running

App Files Files Community

P2-ETF-DQN-ENGINE / features.py

P2SAMAPA

[auto] Deploy DQN code + results to HF Space

5822cc5 verified 3 days ago

raw

history blame contribute delete

9.24 kB

	# features.py
	# Builds the DQN state matrix from raw price and macro data.
	# Implements the 20 technical indicators from:
	# Yasin & Gill (2024) "Reinforcement Learning Framework for Quantitative Trading"
	# arXiv:2411.07585 — ICAIF 2024 FM4TS Workshop

	import numpy as np
	import pandas as pd

	import config


	# ── Individual indicator functions ───────────────────────────────────────────

	def _rsi(series: pd.Series, period: int = 14) -> pd.Series:
	delta = series.diff()
	gain = delta.clip(lower=0).rolling(period).mean()
	loss = (-delta.clip(upper=0)).rolling(period).mean()
	rs = gain / (loss + 1e-9)
	return 100 - (100 / (1 + rs))


	def _macd(series: pd.Series, fast=12, slow=26, signal=9):
	ema_fast = series.ewm(span=fast, adjust=False).mean()
	ema_slow = series.ewm(span=slow, adjust=False).mean()
	macd_line = ema_fast - ema_slow
	signal_line= macd_line.ewm(span=signal, adjust=False).mean()
	histogram = macd_line - signal_line
	return macd_line, signal_line, histogram


	def _stochastic(high: pd.Series, low: pd.Series, close: pd.Series,
	period: int = 14) -> pd.Series:
	lowest = low.rolling(period).min()
	highest = high.rolling(period).max()
	return 100 * (close - lowest) / (highest - lowest + 1e-9)


	def _cci(high: pd.Series, low: pd.Series, close: pd.Series,
	period: int = 20) -> pd.Series:
	tp = (high + low + close) / 3
	sma_tp = tp.rolling(period).mean()
	mad = tp.rolling(period).apply(lambda x: np.mean(np.abs(x - x.mean())), raw=True)
	return (tp - sma_tp) / (0.015 * mad + 1e-9)


	def _roc(series: pd.Series, period: int = 10) -> pd.Series:
	return ((series - series.shift(period)) / (series.shift(period) + 1e-9)) * 100


	def _cmo(series: pd.Series, period: int = 14) -> pd.Series:
	delta = series.diff()
	up = delta.clip(lower=0).rolling(period).sum()
	down = (-delta.clip(upper=0)).rolling(period).sum()
	return 100 * (up - down) / (up + down + 1e-9)


	def _williams_r(high: pd.Series, low: pd.Series, close: pd.Series,
	period: int = 14) -> pd.Series:
	highest = high.rolling(period).max()
	lowest = low.rolling(period).min()
	return -100 * (highest - close) / (highest - lowest + 1e-9)


	def _atr(high: pd.Series, low: pd.Series, close: pd.Series,
	period: int = 14) -> pd.Series:
	tr = pd.concat([
	high - low,
	(high - close.shift(1)).abs(),
	(low - close.shift(1)).abs(),
	], axis=1).max(axis=1)
	return tr.rolling(period).mean()


	def _bbands(series: pd.Series, period: int = 20):
	sma = series.rolling(period).mean()
	std = series.rolling(period).std()
	upper = sma + 2 * std
	lower = sma - 2 * std
	pct_b = (series - lower) / (upper - lower + 1e-9) # %B oscillator
	width = (upper - lower) / (sma + 1e-9)
	return pct_b, width


	def _stoch_rsi(series: pd.Series, rsi_period=14, stoch_period=14) -> pd.Series:
	rsi = _rsi(series, rsi_period)
	min_rsi = rsi.rolling(stoch_period).min()
	max_rsi = rsi.rolling(stoch_period).max()
	return (rsi - min_rsi) / (max_rsi - min_rsi + 1e-9)


	def _ultimate_oscillator(high, low, close, s=7, m=14, l=28) -> pd.Series:
	prev_close = close.shift(1)
	bp = close - pd.concat([low, prev_close], axis=1).min(axis=1)
	tr = pd.concat([high, prev_close], axis=1).max(axis=1) - \
	pd.concat([low, prev_close], axis=1).min(axis=1)
	avg_s = bp.rolling(s).sum() / (tr.rolling(s).sum() + 1e-9)
	avg_m = bp.rolling(m).sum() / (tr.rolling(m).sum() + 1e-9)
	avg_l = bp.rolling(l).sum() / (tr.rolling(l).sum() + 1e-9)
	return 100 * (4 * avg_s + 2 * avg_m + avg_l) / 7


	def _momentum(series: pd.Series, period: int = 10) -> pd.Series:
	return series - series.shift(period)


	def _rolling_zscore(series: pd.Series, window: int = 60) -> pd.Series:
	mu = series.rolling(window, min_periods=10).mean()
	std = series.rolling(window, min_periods=10).std()
	return (series - mu) / (std + 1e-9)


	# ── Per-ETF feature builder ───────────────────────────────────────────────────

	def _etf_features(prices: pd.DataFrame, ticker: str) -> pd.DataFrame:
	"""
	Builds the 20 technical indicators for one ETF.
	Requires OHLCV — if only Close is available, High=Low=Close (safe fallback).
	"""
	close = prices[ticker]
	# yfinance returns OHLCV; if we only have close use it for H/L too
	high = prices.get(f"{ticker}_High", close)
	low = prices.get(f"{ticker}_Low", close)

	ret = close.pct_change()
	feat = pd.DataFrame(index=prices.index)

	# 1. RSI
	feat[f"{ticker}_RSI"] = _rsi(close, config.RSI_PERIOD)
	# 2-4. MACD line, signal, histogram
	ml, sl, hist = _macd(close, config.MACD_FAST, config.MACD_SLOW, config.MACD_SIGNAL)
	feat[f"{ticker}_MACD"] = ml
	feat[f"{ticker}_MACD_sig"] = sl
	feat[f"{ticker}_MACD_hist"] = hist
	# 5. Stochastic %K
	feat[f"{ticker}_Stoch"] = _stochastic(high, low, close, config.STOCH_PERIOD)
	# 6. CCI
	feat[f"{ticker}_CCI"] = _cci(high, low, close, config.CCI_PERIOD)
	# 7. ROC
	feat[f"{ticker}_ROC"] = _roc(close, config.ROC_PERIOD)
	# 8. CMO
	feat[f"{ticker}_CMO"] = _cmo(close, config.CMO_PERIOD)
	# 9. Williams %R
	feat[f"{ticker}_WillR"] = _williams_r(high, low, close)
	# 10. ATR (normalised by close)
	feat[f"{ticker}_ATR"] = _atr(high, low, close, config.ATR_PERIOD) / (close + 1e-9)
	# 11-12. Bollinger %B and width
	pctb, bw = _bbands(close, config.BBANDS_PERIOD)
	feat[f"{ticker}_BB_pctB"] = pctb
	feat[f"{ticker}_BB_width"] = bw
	# 13. StochRSI
	feat[f"{ticker}_StochRSI"] = _stoch_rsi(close, config.RSI_PERIOD, config.STOCH_PERIOD)
	# 14. Ultimate Oscillator
	feat[f"{ticker}_UO"] = _ultimate_oscillator(high, low, close)
	# 15. Momentum
	feat[f"{ticker}_Mom"] = _momentum(close, config.ROC_PERIOD)
	# 16-19. Rolling returns: 1d, 5d, 10d, 21d
	for lag in [1, 5, 10, 21]:
	feat[f"{ticker}_Ret{lag}d"] = close.pct_change(lag)
	# 20. Realised vol (21d annualised)
	feat[f"{ticker}_Vol21d"] = ret.rolling(21).std() * np.sqrt(252)

	return feat


	# ── Macro feature builder ─────────────────────────────────────────────────────

	def _macro_features(macro: pd.DataFrame) -> pd.DataFrame:
	feat = pd.DataFrame(index=macro.index)
	for col in macro.columns:
	feat[f"macro_{col}"] = macro[col]
	# z-score each macro series with 60d rolling window
	feat[f"macro_{col}_Z"] = _rolling_zscore(macro[col], 60)
	return feat


	# ── Master feature matrix ─────────────────────────────────────────────────────

	def build_features(etf_prices: pd.DataFrame,
	macro: pd.DataFrame,
	start_year: int = None) -> pd.DataFrame:
	"""
	Builds the full feature matrix aligned on trading days.
	Returns a DataFrame where each row is one day's state vector.
	"""
	frames = []

	# Technical indicators for each target ETF
	for ticker in config.ETFS:
	if ticker in etf_prices.columns:
	frames.append(_etf_features(etf_prices, ticker))

	# Macro features
	if not macro.empty:
	frames.append(_macro_features(macro))

	feat = pd.concat(frames, axis=1, join="outer")

	# Forward-fill macro (released less frequently than daily)
	feat = feat.ffill(limit=5)

	# Align to ETF trading days only (drop weekends / holidays)
	etf_idx = etf_prices[config.ETFS[0]].dropna().index
	feat = feat.reindex(etf_idx).ffill(limit=5)

	# Filter by start year if provided
	if start_year:
	feat = feat[feat.index.year >= start_year]

	# Drop rows where >50% of features are NaN (warm-up rows)
	thresh = int(len(feat.columns) * 0.5)
	feat = feat.dropna(thresh=thresh)

	# Fill remaining NaNs with 0 (edge-of-history cases)
	feat = feat.fillna(0.0)

	return feat


	def get_feature_names(etf_prices: pd.DataFrame, macro: pd.DataFrame) -> list:
	"""Returns the list of feature column names (for debugging / UI display)."""
	feat = build_features(etf_prices, macro)
	return list(feat.columns)


	def make_state_windows(feat: pd.DataFrame,
	lookback: int = None) -> np.ndarray:
	"""
	Converts feature DataFrame into 3D array of shape
	(n_steps, lookback, n_features) for DQN consumption.
	Windows are stride-1 over the date axis.
	"""
	lb = lookback or config.LOOKBACK_WINDOW
	values = feat.values.astype(np.float32)
	n = len(values)
	if n < lb:
	raise ValueError(f"Not enough data: {n} rows < lookback {lb}")
	windows = np.stack([values[i : i + lb] for i in range(n - lb + 1)])
	return windows # (n - lb + 1, lb, n_features)