# alphaforge-quant-system / meta_model.py
# Uploaded by Premchan369 (commit de3f3f3, verified) — hosting-page header
# kept as comments so the file parses as Python.
"""Meta-Model: Learns which model/signal to trust dynamically.
This mimics how Renaissance Technologies combines signals — a meta-learner
weights LSTM, Transformer, XGBoost, and sentiment based on recent performance,
regime, and volatility state.
"""
import numpy as np
import pandas as pd
import torch
import torch.nn as nn
from sklearn.ensemble import GradientBoostingRegressor
from typing import Dict, List, Optional, Tuple
import warnings
warnings.filterwarnings('ignore')
class MetaModel:
    """Meta-learner that dynamically weights base model predictions.

    Builds meta-features from per-model predictions, rolling IC history,
    a regime encoding, and a volatility level, then trains a second-stage
    model ('xgb', 'nn', or 'bayesian') to map those features to realized
    returns. Also provides a lighter, training-free path
    (adaptive_predict) that weights models by recent positive IC.
    """

    def __init__(self,
                 base_models: Optional[List[str]] = None,
                 meta_learner_type: str = 'xgb',
                 lookback_window: int = 63,
                 device: str = 'cpu'):
        """
        Args:
            base_models: Names of base models
                (default: ['lstm', 'transformer', 'xgboost', 'sentiment']).
            meta_learner_type: 'xgb', 'nn', or 'bayesian'.
            lookback_window: How many days of past performance to use as features.
            device: torch device string used by the NN meta-learner.
        """
        self.base_models = base_models or ['lstm', 'transformer', 'xgboost', 'sentiment']
        self.meta_learner_type = meta_learner_type
        self.lookback_window = lookback_window
        self.device = torch.device(device)
        self.meta_model = None  # second-stage model; set by fit()
        # model name -> rolling list of Spearman ICs (trimmed to lookback_window)
        self.performance_history = {m: [] for m in self.base_models}
        self.weight_history = []  # weight dicts recorded by adaptive_predict()
        self.is_fitted = False

    def _build_meta_features(self,
                             predictions: Dict[str, np.ndarray],
                             regime: Optional[str] = None,
                             volatility: Optional[float] = None,
                             recent_returns: Optional[np.ndarray] = None) -> np.ndarray:
        """Build the feature matrix for the meta-learner.

        Columns, in order:
          - raw prediction of each base model (zeros if a model is absent,
            so the layout stays stable across calls),
          - mean / std / last value of each model's rolling IC history,
          - regime encoding, volatility level, mean of last 5 market returns.
        """
        n_samples = len(next(iter(predictions.values())))
        features = []
        # Raw predictions (missing models contribute a zero column).
        for model in self.base_models:
            features.append(predictions.get(model, np.zeros(n_samples)))
        # Rolling-IC summary stats per model, left-padded with zeros to a
        # fixed lookback_window length (single-pass pad, not repeated prepends).
        for model in self.base_models:
            perf = self.performance_history.get(model, [])[-self.lookback_window:]
            perf = [0.0] * (self.lookback_window - len(perf)) + perf
            features.append(np.full(n_samples, np.mean(perf)))
            features.append(np.full(n_samples, np.std(perf) if len(perf) > 1 else 0.0))
            features.append(np.full(n_samples, perf[-1] if perf else 0.0))
        # Regime encoding (unknown regime labels map to neutral 0.5).
        if regime:
            regime_map = {'bull': 1.0, 'bear': -1.0, 'high_vol': 0.0, 'neutral': 0.5}
            features.append(np.full(n_samples, regime_map.get(regime, 0.5)))
        else:
            features.append(np.zeros(n_samples))
        # Volatility level. Explicit None check: the old `volatility or 0.2`
        # silently replaced a legitimate 0.0 volatility with the default.
        features.append(np.full(n_samples, 0.2 if volatility is None else volatility))
        # Trailing 5-period mean market return.
        if recent_returns is not None and len(recent_returns) > 0:
            features.append(np.full(n_samples, np.mean(recent_returns[-5:])))
        else:
            features.append(np.zeros(n_samples))
        return np.column_stack(features)

    def fit(self,
            predictions_train: Dict[str, np.ndarray],
            actual_train: np.ndarray,
            regime_train: Optional[List[str]] = None,
            volatility_train: Optional[np.ndarray] = None) -> Dict:
        """Train the meta-learner to predict realized returns from base predictions.

        NOTE: only the first regime / volatility entry is used — the feature
        builder broadcasts a single value across all training samples.

        Returns:
            Dict with in-sample 'meta_ic', 'meta_mse', and 'n_samples'.

        Raises:
            ValueError: if meta_learner_type is not 'xgb', 'nn', or 'bayesian'.
        """
        n_samples = len(actual_train)
        X_meta = self._build_meta_features(
            predictions_train,
            regime=regime_train[0] if regime_train else None,
            volatility=(volatility_train[0]
                        if volatility_train is not None and len(volatility_train) > 0
                        else None)
        )
        if self.meta_learner_type == 'xgb':
            self.meta_model = GradientBoostingRegressor(
                n_estimators=100,
                max_depth=4,
                learning_rate=0.05,
                subsample=0.8,
                random_state=42
            )
            self.meta_model.fit(X_meta, actual_train)
        elif self.meta_learner_type == 'nn':
            self.meta_model = self._build_nn_meta_model(X_meta.shape[1])
            self._train_nn_meta(X_meta, actual_train)
        elif self.meta_learner_type == 'bayesian':
            # Median-quantile GBM as a cheap stand-in for a Bayesian learner.
            self.meta_model = GradientBoostingRegressor(
                n_estimators=100,
                max_depth=4,
                learning_rate=0.05,
                loss='quantile', alpha=0.5,
                random_state=42
            )
            self.meta_model.fit(X_meta, actual_train)
        else:
            # Fail fast: previously an unknown type left meta_model=None but
            # still flipped is_fitted, crashing later inside predict_meta().
            raise ValueError(f"Unknown meta_learner_type: {self.meta_learner_type!r}")
        self.is_fitted = True
        # In-sample diagnostics.
        pred = self.predict_meta(predictions_train, regime_train, volatility_train)
        from scipy.stats import spearmanr
        ic, _ = spearmanr(pred, actual_train)
        if np.isnan(ic):
            # Constant predictions yield NaN IC; report 0.0 for consistency
            # with update_performance().
            ic = 0.0
        mse = np.mean((pred - actual_train) ** 2)
        return {
            'meta_ic': ic,
            'meta_mse': mse,
            'n_samples': n_samples
        }

    def _build_nn_meta_model(self, input_size: int) -> nn.Module:
        """Build a small feed-forward NN meta-learner (input -> 64 -> 32 -> 1)."""
        class MetaNN(nn.Module):
            def __init__(self, input_size):
                super().__init__()
                self.net = nn.Sequential(
                    nn.Linear(input_size, 64),
                    nn.ReLU(),
                    nn.Dropout(0.2),
                    nn.Linear(64, 32),
                    nn.ReLU(),
                    nn.Linear(32, 1)
                )

            def forward(self, x):
                return self.net(x)

        return MetaNN(input_size).to(self.device)

    def _train_nn_meta(self, X: np.ndarray, y: np.ndarray, epochs: int = 50):
        """Full-batch MSE training of the NN meta-learner with Adam."""
        X_t = torch.FloatTensor(X).to(self.device)
        y_t = torch.FloatTensor(y).unsqueeze(1).to(self.device)
        optimizer = torch.optim.Adam(self.meta_model.parameters(), lr=1e-3)
        criterion = nn.MSELoss()
        self.meta_model.train()  # dropout active; hoisted out of the loop
        for _ in range(epochs):
            optimizer.zero_grad()
            loss = criterion(self.meta_model(X_t), y_t)
            loss.backward()
            optimizer.step()

    def predict_meta(self,
                     predictions: Dict[str, np.ndarray],
                     regimes: Optional[List[str]] = None,
                     volatilities: Optional[np.ndarray] = None) -> np.ndarray:
        """Generate meta-model predictions.

        Before fit() has been called, falls back to an equal-weight average
        of the base model predictions.
        """
        if not self.is_fitted:
            n_samples = len(next(iter(predictions.values())))
            preds = [predictions.get(m, np.zeros(n_samples)) for m in self.base_models]
            return np.mean(preds, axis=0)
        X_meta = self._build_meta_features(
            predictions,
            regime=regimes[0] if regimes else None,
            volatility=(volatilities[0]
                        if volatilities is not None and len(volatilities) > 0
                        else None)
        )
        if self.meta_learner_type == 'nn':
            self.meta_model.eval()
            with torch.no_grad():
                X_t = torch.FloatTensor(X_meta).to(self.device)
                pred = self.meta_model(X_t).cpu().numpy().flatten()
        else:
            pred = self.meta_model.predict(X_meta)
        return pred

    def update_performance(self, model_name: str, prediction: np.ndarray, actual: np.ndarray):
        """Append the Spearman IC of (prediction, actual) to a model's history.

        Unknown model names get a history created on the fly instead of
        raising KeyError — adaptive_predict() may pass models that are not
        in base_models.
        """
        from scipy.stats import spearmanr
        ic, _ = spearmanr(prediction, actual)
        if np.isnan(ic):
            ic = 0.0
        history = self.performance_history.setdefault(model_name, [])
        history.append(ic)
        # Keep only the trailing lookback window.
        self.performance_history[model_name] = history[-self.lookback_window:]

    def get_model_weights(self) -> Dict[str, float]:
        """Performance-implied weights: mean positive IC per model, normalized.

        Negative average ICs are clipped to zero (no "shorting" of models);
        if no model has positive average IC, fall back to equal weights.
        """
        weights = {}
        for model in self.base_models:
            perf = self.performance_history.get(model, [0.0])
            avg_ic = np.mean(perf) if perf else 0.0
            weights[model] = max(avg_ic, 0.0)
        total = sum(weights.values())
        if total > 0:
            return {k: v / total for k, v in weights.items()}
        return {k: 1.0 / len(self.base_models) for k in self.base_models}

    def adaptive_predict(self,
                         predictions: Dict[str, np.ndarray],
                         actual_prev: Optional[np.ndarray] = None,
                         regime: Optional[str] = None) -> Tuple[np.ndarray, Dict[str, float]]:
        """Combine base predictions with performance-adaptive weights.

        Args:
            predictions: model name -> prediction vector (equal lengths).
            actual_prev: realized values aligned with the previous prediction
                batch; if given, each model's IC history is refreshed first.
            regime: currently unused (weights come from IC history only).

        Returns:
            (weighted prediction vector, weight dict used).
        """
        # Refresh IC history if previous actuals are available.
        if actual_prev is not None:
            for model, pred in predictions.items():
                if len(pred) == len(actual_prev):
                    self.update_performance(model, pred, actual_prev)
        weights = self.get_model_weights()
        self.weight_history.append(weights)
        # Weighted combination over models we actually have predictions for.
        n_samples = len(next(iter(predictions.values())))
        final_pred = np.zeros(n_samples)
        for model, weight in weights.items():
            if model in predictions:
                final_pred += weight * predictions[model]
        return final_pred, weights