"""
Model Manager for HMM-SVR Trading Models
Handles training, saving, loading, and prediction for live trading.
Models are persisted to disk for Hugging Face Spaces cold start handling.
"""
import os
import joblib
import numpy as np
import pandas as pd
import yfinance as yf
from datetime import datetime, timedelta
from typing import Optional, Dict, Tuple, Any
from hmmlearn.hmm import GaussianHMM
from sklearn.svm import SVR
from sklearn.preprocessing import StandardScaler
from binance.client import Client
from dotenv import load_dotenv

# Load variables from a local .env file (if any) into the process environment.
load_dotenv()

# Directory for storing trained models: a 'models' folder located next to this
# file. It is created at import time if it does not already exist.
MODEL_DIR = os.path.join(os.path.dirname(__file__), 'models')
os.makedirs(MODEL_DIR, exist_ok=True)

# Global in-process cache for loaded models (survives until Space sleeps).
# Keys are upper-cased symbols; values are the model dicts written by
# train_and_save_model() and read back by load_model().
_model_cache: Dict[str, Dict[str, Any]] = {}


def get_model_path(symbol: str) -> str:
    """Return the on-disk location of the saved HMM-SVR bundle for ``symbol``.

    The symbol is lower-cased before it is embedded in the file name, so
    ``BTC`` and ``btc`` resolve to the same file inside ``MODEL_DIR``.
    """
    filename = '{}_hmm_svr.pkl'.format(symbol.lower())
    return os.path.join(MODEL_DIR, filename)


def is_model_trained(symbol: str) -> bool:
    """Report whether a saved model file is present on disk for ``symbol``."""
    model_file = get_model_path(symbol)
    return os.path.exists(model_file)


def get_model_info(symbol: str) -> Optional[Dict]:
    """Summarise the metadata stored with a trained model.

    Returns a dict with ``symbol``, ``trained_at``, ``n_states``,
    ``avg_train_vol`` and ``train_days`` (missing entries fall back to
    defaults). Returns ``None`` when no model file exists or when the file
    cannot be read; in the latter case the error is printed, not raised.
    """
    path = get_model_path(symbol)
    if os.path.exists(path):
        try:
            stored = joblib.load(path)
            # (key, fallback) pairs, in the order they appear in the result.
            metadata_defaults = (
                ('trained_at', 'Unknown'),
                ('n_states', 3),
                ('avg_train_vol', 0),
                ('train_days', 0),
            )
            info = {'symbol': symbol}
            for key, fallback in metadata_defaults:
                info[key] = stored.get(key, fallback)
            return info
        except Exception as e:
            print(f"[ModelManager] Error reading model info for {symbol}: {e}")
    return None


def fetch_training_data_yfinance(ticker: str, years: int = 4) -> Optional[pd.DataFrame]:
    """
    Download daily history from Yahoo Finance to use as training data.

    Binance-style symbols are rewritten to Yahoo's naming by replacing the
    ``USDT`` / ``BUSD`` quote with ``-USD`` (e.g. BTCUSDT -> BTC-USD).

    Args:
        ticker: Symbol to download.
        years: How many 365-day years of history to request, ending now.

    Returns:
        The downloaded frame with rows containing NaN removed, or ``None``
        when nothing was returned or the download raised (the error is
        printed).
    """
    # Apply the quote-currency rewrites in a fixed order: USDT first, then BUSD.
    yahoo_ticker = ticker
    for quote in ('USDT', 'BUSD'):
        yahoo_ticker = yahoo_ticker.replace(quote, '-USD')

    window_end = datetime.now()
    window_start = window_end - timedelta(days=years * 365)

    print(f"[ModelManager] Fetching {years} years of data for {yahoo_ticker}...")

    try:
        prices = yf.download(
            yahoo_ticker,
            start=window_start,
            end=window_end,
            progress=False,
            auto_adjust=True,
        )

        if prices.empty:
            print(f"[ModelManager] No data returned for {yahoo_ticker}")
            return None

        # yfinance may hand back two-level columns; flatten to whichever
        # level carries the price field names.
        columns = prices.columns
        if isinstance(columns, pd.MultiIndex):
            first_level = columns.get_level_values(0)
            if 'Close' in first_level:
                prices.columns = first_level
            else:
                prices.columns = columns.get_level_values(1)

        print(f"[ModelManager] Fetched {len(prices)} days of data")
        return prices.dropna()
    except Exception as e:
        print(f"[ModelManager] Error fetching data: {e}")
        return None


def fetch_training_data_binance(symbol: str, days: int = 1460) -> Optional[pd.DataFrame]:
    """
    Download daily klines from Binance to use as training data.

    Used as the fallback source when Yahoo Finance does not deliver enough
    history.

    Args:
        symbol: Binance symbol passed straight to the klines endpoint.
        days: Number of calendar days of history to request, ending today.

    Returns:
        A frame indexed by kline open time with float ``Open``, ``High``,
        ``Low``, ``Close`` and ``Volume`` columns (NaN rows removed), or
        ``None`` when no klines came back or any step raised (the error is
        printed).
    """
    try:
        client = Client()  # Public market data: no API keys supplied

        until = datetime.now()
        since = until - timedelta(days=days)
        day_format = '%Y-%m-%d'

        print(f"[ModelManager] Fetching {days} days of Binance data for {symbol}...")

        klines = client.get_historical_klines(
            symbol=symbol,
            interval=Client.KLINE_INTERVAL_1DAY,
            start_str=since.strftime(day_format),
            end_str=until.strftime(day_format)
        )

        if not klines:
            print(f"[ModelManager] No Binance data returned for {symbol}")
            return None

        kline_fields = [
            'timestamp', 'Open', 'High', 'Low', 'Close', 'Volume',
            'close_time', 'quote_volume', 'trades', 'taker_buy_base',
            'taker_buy_quote', 'ignore'
        ]
        frame = pd.DataFrame(klines, columns=kline_fields)

        frame['timestamp'] = pd.to_datetime(frame['timestamp'], unit='ms')
        frame = frame.set_index('timestamp')

        # Convert the price/volume fields to float, one column at a time.
        for column in ('Close', 'Open', 'High', 'Low', 'Volume'):
            frame[column] = frame[column].astype(float)

        print(f"[ModelManager] Fetched {len(frame)} days from Binance")
        return frame[['Open', 'High', 'Low', 'Close', 'Volume']].dropna()
    except Exception as e:
        print(f"[ModelManager] Error fetching Binance data: {e}")
        return None


def engineer_features(df: pd.DataFrame) -> pd.DataFrame:
    """
    Build the training feature set from a price frame (as defined in strategy.py).

    Works on a copy of ``df`` (which must have a ``Close`` column) and adds:

    * ``Log_Returns``      - log of close over previous close
    * ``Volatility``       - 10-row rolling std of ``Log_Returns``
    * ``Downside_Returns`` - ``Log_Returns`` where negative, otherwise 0
    * ``Downside_Vol``     - 10-row rolling std of ``Downside_Returns``
    * ``Target_Next_Vol``  - the following row's ``Volatility`` (SVR target)

    Rows containing any NaN are removed. Because the target looks one row
    ahead, the final input row never appears in the result.
    """
    window = 10
    features = df.copy()

    close = features['Close']
    log_returns = np.log(close / close.shift(1))
    features['Log_Returns'] = log_returns
    features['Volatility'] = log_returns.rolling(window=window).std()

    def _losses_only(value):
        # Anything that is not strictly negative (including NaN) counts as 0.
        return value if value < 0 else 0

    features['Downside_Returns'] = log_returns.apply(_losses_only)
    features['Downside_Vol'] = features['Downside_Returns'].rolling(window).std()

    # SVR label: volatility observed on the next row.
    features['Target_Next_Vol'] = features['Volatility'].shift(-1)

    return features.dropna()


def train_hmm_model(train_df: pd.DataFrame, n_states: int = 3) -> Tuple[GaussianHMM, Dict[int, int]]:
    """
    Fit a Gaussian HMM and rank its hidden states by volatility.

    The model is fitted on ``Log_Returns`` and ``Volatility`` (both scaled by
    100). Each raw state is then ranked by the mean ``Volatility`` of the
    training rows assigned to it:

        rank 0          = lowest volatility (Safe)
        rank n_states-1 = highest volatility (Crash)

    A state with no assigned rows is given a mean of 0.

    Returns:
        ``(model, mapping)`` where ``mapping`` translates a raw HMM state id
        to its volatility rank.
    """
    observations = train_df[['Log_Returns', 'Volatility']].values * 100

    hmm = GaussianHMM(n_components=n_states, covariance_type="full", n_iter=100, random_state=42)
    hmm.fit(observations)

    decoded = hmm.predict(observations)

    def _mean_volatility(state):
        members = decoded == state
        return observations[members, 1].mean() if members.sum() > 0 else 0

    # Stable sort, so states with equal means keep their raw-id order.
    ranked = sorted(
        ((state, _mean_volatility(state)) for state in range(n_states)),
        key=lambda pair: pair[1],
    )
    mapping = {raw_state: rank for rank, (raw_state, _) in enumerate(ranked)}

    return hmm, mapping


def train_svr_model(train_df: pd.DataFrame) -> Tuple[SVR, StandardScaler]:
    """
    Fit an RBF-kernel SVR that maps today's features to next-day volatility.

    Inputs are ``Log_Returns``, ``Volatility``, ``Downside_Vol`` and
    ``Regime``, standardised with a ``StandardScaler``; the label is
    ``Target_Next_Vol``.

    Returns:
        ``(svr, scaler)`` - the fitted regressor and the scaler that must be
        applied to features before calling ``svr.predict``.
    """
    inputs = train_df[['Log_Returns', 'Volatility', 'Downside_Vol', 'Regime']].values
    labels = train_df['Target_Next_Vol'].values

    scaler = StandardScaler().fit(inputs)

    svr = SVR(kernel='rbf', C=100, gamma=0.1, epsilon=0.01)
    svr.fit(scaler.transform(inputs), labels)

    return svr, scaler


def train_and_save_model(symbol: str, n_states: int = 3, binance_symbol: str = None, save_as: str = None) -> Dict[str, Any]:
    """
    Train the HMM and SVR for one symbol, persist them, and cache the result.

    Data comes from Yahoo Finance first; if that yields fewer than 250 rows
    (or nothing), Binance is tried instead.

    Args:
        symbol: Base symbol (e.g., 'BTC') or Yahoo Finance format (e.g., 'BTC-USD')
        n_states: Number of HMM states (default 3)
        binance_symbol: Full Binance symbol (e.g., 'BTCUSDT') for the fallback
                        download; when omitted, ``f"{save_as}USDT"`` is used
        save_as: Base symbol used for the model file name and cache key
                 (e.g., 'BTC'). When omitted it is derived from ``symbol`` by
                 removing 'USDT' and '-USD'

    Returns:
        On success, a dict with ``success``, ``symbol``, ``trained_at``,
        ``train_days``, ``avg_train_vol``, ``n_states`` and ``model_path``.
        On insufficient data, a dict with a single ``error`` message.
    """
    # BTCUSDT -> BTC, BTC-USD -> BTC, BTC -> BTC
    if save_as is None:
        save_as = symbol.replace('USDT', '').replace('-USD', '')

    banner = '=' * 60
    print(f"\n{banner}")
    print(f"[ModelManager] Training HMM-SVR model for {save_as}")
    print(banner)

    def _too_short(frame):
        return frame is None or len(frame) < 250

    # Primary source: Yahoo Finance. Secondary: Binance.
    df = fetch_training_data_yfinance(symbol)
    if _too_short(df):
        print("[ModelManager] Falling back to Binance data...")
        df = fetch_training_data_binance(binance_symbol or f"{save_as}USDT")

    if _too_short(df):
        available = 0 if df is None else len(df)
        return {"error": f"Insufficient data for {save_as}. Need at least 250 days, got {available}."}

    df = engineer_features(df)
    usable_days = len(df)

    if usable_days < 200:
        return {"error": f"Insufficient data after feature engineering for {save_as}. Got {usable_days} days."}

    print(f"[ModelManager] Training on {usable_days} days of data...")

    print("[ModelManager] Training HMM model...")
    hmm_model, state_mapping = train_hmm_model(df, n_states=n_states)

    # Label every training row with its volatility-ranked regime.
    scaled_observations = df[['Log_Returns', 'Volatility']].values * 100
    df['Regime'] = [state_mapping[raw] for raw in hmm_model.predict(scaled_observations)]

    # Baseline used later as the denominator of the risk ratio.
    avg_train_vol = df['Volatility'].mean()

    print("[ModelManager] Training SVR model...")
    svr_model, svr_scaler = train_svr_model(df)

    trained_at = datetime.now().isoformat()
    model_data = {
        'hmm_model': hmm_model,
        'svr_model': svr_model,
        'svr_scaler': svr_scaler,
        'state_mapping': state_mapping,
        'avg_train_vol': avg_train_vol,
        'n_states': n_states,
        'train_days': usable_days,
        'trained_at': trained_at,
        'symbol': save_as
    }

    # Persist under the base symbol (e.g., BTC not BTCUSDT or BTC-USD) ...
    model_path = get_model_path(save_as)
    joblib.dump(model_data, model_path)

    # ... and make it immediately available from the in-memory cache.
    _model_cache[save_as.upper()] = model_data

    print(f"[ModelManager] ✅ Model saved to {model_path}")
    print(f"[ModelManager] States: 0=Low Vol (Safe), {n_states - 1}=High Vol (Crash)")
    print(f"[ModelManager] Avg training volatility: {avg_train_vol:.6f}")

    return {
        "success": True,
        "symbol": save_as,
        "trained_at": trained_at,
        "train_days": usable_days,
        "avg_train_vol": avg_train_vol,
        "n_states": n_states,
        "model_path": model_path
    }


def load_model(symbol: str) -> Optional[Dict[str, Any]]:
    """
    Return the trained model bundle for ``symbol``, using the cache if possible.

    The in-memory cache (keyed by the upper-cased symbol) is consulted first;
    on a miss the bundle is read from disk and cached. Returns ``None`` when
    no model file exists or when loading fails (the error is printed).
    """
    cache_key = symbol.upper()

    try:
        cached = _model_cache[cache_key]
    except KeyError:
        pass
    else:
        print(f"[ModelManager] Using cached model for {symbol}")
        return cached

    model_path = get_model_path(symbol)
    if os.path.exists(model_path):
        try:
            print(f"[ModelManager] Loading model from {model_path}...")
            loaded = joblib.load(model_path)
            _model_cache[cache_key] = loaded
            print(f"[ModelManager] ✅ Model loaded for {symbol}")
            return loaded
        except Exception as e:
            print(f"[ModelManager] Error loading model: {e}")
            return None

    print(f"[ModelManager] No model found for {symbol} at {model_path}")
    return None


def load_all_models() -> Dict[str, bool]:
    """
    Warm the cache with every model file found in ``MODEL_DIR``.

    Intended to be called on application startup.

    Returns:
        A dict mapping each discovered symbol (upper-cased, taken from the
        file name) to ``True`` if it loaded and ``False`` otherwise. Empty
        when the models directory does not exist.
    """
    print("\n[ModelManager] Loading all models from disk...")
    results = {}

    if not os.path.exists(MODEL_DIR):
        print("[ModelManager] No models directory found")
        return results

    suffix = '_hmm_svr.pkl'
    model_files = [name for name in os.listdir(MODEL_DIR) if name.endswith(suffix)]
    for name in model_files:
        symbol = name.replace(suffix, '').upper()
        results[symbol] = load_model(symbol) is not None

    print(f"[ModelManager] Loaded {sum(results.values())} models: {list(results.keys())}")
    return results


def _build_live_features(recent_data: pd.DataFrame) -> pd.DataFrame:
    """Compute the model input features while keeping the most recent row.

    Produces the same ``Log_Returns``, ``Volatility``, ``Downside_Returns``
    and ``Downside_Vol`` columns as ``engineer_features`` (the formulas are
    kept identical on purpose), but does NOT add ``Target_Next_Vol``. That
    label is the next row's volatility, which is NaN on the newest row, so
    including it would make ``dropna()`` discard exactly the row that a live
    prediction needs.
    """
    df = recent_data.copy()
    df['Log_Returns'] = np.log(df['Close'] / df['Close'].shift(1))
    df['Volatility'] = df['Log_Returns'].rolling(window=10).std()
    df['Downside_Returns'] = df['Log_Returns'].apply(lambda x: x if x < 0 else 0)
    df['Downside_Vol'] = df['Downside_Returns'].rolling(10).std()
    return df.dropna()


def predict_regime_and_volatility(
    symbol: str,
    recent_data: pd.DataFrame
) -> Optional[Dict[str, Any]]:
    """
    Use trained model to predict current regime and next volatility.

    Features are computed up to and including the last row of
    ``recent_data``, so the regime, ``current_vol`` and ``close_price`` all
    describe that row and ``predicted_vol`` is the forecast for the row
    after it.

    Args:
        symbol: Symbol whose saved model should be used (passed to
                ``load_model``)
        recent_data: DataFrame with recent price data (needs Close column)

    Returns:
        Dict with ``regime``, ``regime_label``, ``predicted_vol``,
        ``current_vol``, ``risk_ratio``, ``avg_train_vol``, ``n_states``,
        ``log_return`` and ``close_price``; or a dict with a single
        ``error`` key when no model exists or fewer than 20 feature rows
        are available.
    """
    model_data = load_model(symbol)
    if model_data is None:
        return {"error": f"No model found for {symbol}. Train it first."}

    hmm_model = model_data['hmm_model']
    svr_model = model_data['svr_model']
    svr_scaler = model_data['svr_scaler']
    state_mapping = model_data['state_mapping']
    avg_train_vol = model_data['avg_train_vol']
    n_states = model_data['n_states']

    # Live features: no training label, so the newest row survives dropna().
    df = _build_live_features(recent_data)

    if len(df) < 20:
        return {"error": "Insufficient recent data for prediction"}

    # Decode the regime path over the recent window; the last decoded state
    # is the current regime.
    lookback = min(252, len(df))  # Use up to 1 year of data
    recent_window = df.iloc[-lookback:]

    # Same x100 scaling as used when the HMM was fitted.
    X_hmm = recent_window[['Log_Returns', 'Volatility']].values * 100
    hidden_states = hmm_model.predict(X_hmm)
    current_state_raw = hidden_states[-1]
    # Translate the raw HMM state id into its volatility rank.
    current_regime = state_mapping.get(current_state_raw, current_state_raw)

    latest = df.iloc[-1]

    # Feature order must match the one used to fit the SVR and its scaler.
    svr_features = np.array([[
        latest['Log_Returns'],
        latest['Volatility'],
        latest['Downside_Vol'],
        current_regime
    ]])
    svr_features_scaled = svr_scaler.transform(svr_features)
    predicted_vol = svr_model.predict(svr_features_scaled)[0]

    # Forecast volatility relative to the training-period average.
    # NOTE(review): the SVR output is not constrained to be positive, so a
    # non-positive predicted_vol (and hence risk_ratio) is possible - confirm
    # that downstream sizing rules are happy with that.
    risk_ratio = predicted_vol / avg_train_vol if avg_train_vol > 0 else 1.0

    if current_regime == 0:
        regime_label = 'Safe'
    elif current_regime == n_states - 1:
        regime_label = 'Crash'
    else:
        regime_label = 'Normal'

    return {
        'regime': int(current_regime),
        'regime_label': regime_label,
        'predicted_vol': float(predicted_vol),
        'current_vol': float(latest['Volatility']),
        'risk_ratio': float(risk_ratio),
        'avg_train_vol': float(avg_train_vol),
        'n_states': n_states,
        'log_return': float(latest['Log_Returns']),
        'close_price': float(latest['Close'])
    }


def calculate_signal_and_position(
    symbol: str,
    recent_data: pd.DataFrame,
    short_window: int = 12,
    long_window: int = 26,
    lookback_window: int = 252
) -> Optional[Dict[str, Any]]:
    """
    Calculate trading signal and position sizing with walk-forward logic.
    Enhanced to match backtest methodology more closely.

    Args:
        symbol: Symbol whose trained model is used for the regime/volatility
                prediction.
        recent_data: Recent price data (needs Close column).
        short_window: Span of the fast EMA.
        long_window: Span of the slow EMA.
        lookback_window: Number of most recent rows the EMAs are computed on.

    Returns:
        If the prediction step fails, its result (``None`` or an ``error``
        dict) is returned unchanged. Otherwise a dict with the EMA signal
        and values, regime info, ``position_size_multiplier`` (sizing before
        the trend filter), ``target_position`` (multiplier times the 0/1 EMA
        signal), ``signal_stability``, ``ema_gap_percent`` and a
        human-readable ``reasoning`` string that describes the target
        position actually taken.
    """
    prediction = predict_regime_and_volatility(symbol, recent_data)
    if prediction is None or 'error' in prediction:
        return prediction

    # The prediction already reports the model's state count, so the model
    # does not need to be loaded a second time.
    n_states = prediction['n_states']

    # EMAs are computed on the trailing window only (not the full history),
    # on a copy so the caller's frame is left untouched.
    window = recent_data.iloc[-lookback_window:].copy()
    window['EMA_Short'] = window['Close'].ewm(span=short_window).mean()
    window['EMA_Long'] = window['Close'].ewm(span=long_window).mean()

    latest = window.iloc[-1]

    # EMA crossover signal (1 = bullish, 0 = bearish)
    ema_signal = 1 if latest['EMA_Short'] > latest['EMA_Long'] else 0

    # Share of the last 5 rows that were bullish: 1.0 = all bullish,
    # 0.0 = all bearish. Neutral 0.5 when fewer than 5 rows are available.
    if len(window) >= 5:
        last_five = window.tail(5)
        bullish_rows = (last_five['EMA_Short'] > last_five['EMA_Long']).astype(int)
        signal_stability = float(bullish_rows.sum() / 5.0)
    else:
        signal_stability = 0.5

    regime = prediction['regime']
    risk_ratio = prediction['risk_ratio']

    # 5-level sizing (applied before the trend filter):
    # - 0x:   crash regime
    # - 0.5x: normal regime with high risk (defensive)
    # - 1x:   standard position (also the default for any other regime)
    # - 2x:   safe regime with moderate risk OR normal regime with low risk
    # - 3x:   safe regime with very low risk (sniper mode)
    position_size = 1.0

    # Debug logging to verify conditions
    print(f"[Leverage Logic] {symbol}: Regime={regime}/{n_states-1}, Risk={risk_ratio:.3f}, EMA_Signal={ema_signal}")

    # Crash protocol: highest-volatility regime always sizes to 0x.
    if regime == n_states - 1:
        position_size = 0.0
        print(f"[Leverage Logic] {symbol}: CRASH REGIME → 0x position")

    # Safe regime (lowest volatility)
    elif regime == 0:
        if risk_ratio < 0.5:
            position_size = 3.0
            print(f"[Leverage Logic] {symbol}: SNIPER MODE (Safe + Very Low Risk) → 3x")
        elif risk_ratio < 0.85:
            position_size = 2.0
            print(f"[Leverage Logic] {symbol}: Safe + Moderate Risk → 2x")
        else:
            position_size = 1.0
            print(f"[Leverage Logic] {symbol}: Safe + High Risk → 1x")

    # Normal regime (middle volatility)
    elif regime == 1:
        if risk_ratio < 0.5:
            position_size = 2.0
            print(f"[Leverage Logic] {symbol}: Normal + Low Risk → 2x")
        elif risk_ratio > 1.2:
            position_size = 0.5
            print(f"[Leverage Logic] {symbol}: Normal + High Risk → 0.5x (defensive)")
        else:
            position_size = 1.0
            print(f"[Leverage Logic] {symbol}: Normal + Moderate Risk → 1x")

    # Trend filter: a bearish signal (0) means no position regardless of size.
    target_position = ema_signal * position_size

    # Explain the position that is actually taken. Passing target_position
    # (not the pre-filter multiplier) makes a bearish trend read as
    # "CASH (Bearish Trend)" instead of advertising leverage that is not used.
    reasoning = _get_signal_reasoning(
        ema_signal, regime, risk_ratio, target_position, n_states, signal_stability
    )

    # Relative gap between the EMAs, in percent (strength of the trend).
    ema_gap_percent = float(
        (latest['EMA_Short'] - latest['EMA_Long']) / latest['EMA_Long'] * 100
    )

    return {
        'ema_signal': ema_signal,
        'ema_short': float(latest['EMA_Short']),
        'ema_long': float(latest['EMA_Long']),
        'regime': regime,
        'regime_label': prediction['regime_label'],
        'predicted_vol': prediction['predicted_vol'],
        'risk_ratio': risk_ratio,
        'position_size_multiplier': position_size,
        'target_position': target_position,  # 0, 0.5, 1, 2 or 3
        'close_price': float(latest['Close']),
        'signal_stability': signal_stability,
        'reasoning': reasoning,
        'ema_gap_percent': ema_gap_percent
    }


def _get_signal_reasoning(ema_signal: int, regime: int, risk_ratio: float, 
                          position_size: float, n_states: int, signal_stability: float = 0.5) -> str:
    """Build the one-line, human-readable explanation of a signal.

    The result is four fragments joined by " | ": trend (with a conviction
    tag derived from ``signal_stability``), regime, risk outlook and
    position.
    """
    crash_regime = n_states - 1

    # --- Trend, tagged with how consistent the signal has been ---
    if ema_signal == 1:
        if signal_stability > 0.8:
            conviction = "STRONG"
        elif signal_stability < 0.4:
            conviction = "WEAK"
        else:
            conviction = "MODERATE"
        trend_part = f"✅ Trend UP (12-EMA > 26-EMA) [{conviction}]"
    else:
        # For a down-trend, a LOW bullish share means a strong signal.
        if signal_stability < 0.2:
            conviction = "STRONG"
        elif signal_stability > 0.6:
            conviction = "WEAK"
        else:
            conviction = "MODERATE"
        trend_part = f"📉 Trend DOWN (12-EMA < 26-EMA) [{conviction}]"

    # --- Regime ---
    if regime == 0:
        regime_part = "🛡️ Safe Regime (Low Volatility)"
    elif regime == crash_regime:
        regime_part = "🚨 CRASH REGIME (High Volatility)"
    else:
        regime_part = "⚖️ Normal Regime (Neutral Volatility)"

    # --- Risk outlook ---
    if risk_ratio < 0.5:
        risk_part = f"🌤️ Future Looks Calm (risk: {risk_ratio:.2f})"
    elif risk_ratio > 1.5:
        risk_part = f"⚠️ High Future Risk (risk: {risk_ratio:.2f})"
    else:
        risk_part = f"📊 Normal Risk (ratio: {risk_ratio:.2f})"

    # --- Position ---
    fixed_sizes = (
        (3.0, "→ 🚀 MAX LEVERAGE 3x (Sniper Mode!)"),
        (2.0, "→ 📈 MEDIUM LEVERAGE 2x (Favorable)"),
        (1.0, "→ ✅ Standard 1x Position"),
        (0.5, "→ ⚠️ REDUCED 0.5x (Defensive)"),
    )
    for size, label in fixed_sizes:
        if position_size == size:
            position_part = label
            break
    else:
        if position_size == 0.0:
            # Flat: say whether the regime or the trend is the cause.
            if regime == crash_regime:
                position_part = "→ 🛑 CASH (Crash Protocol Override)"
            else:
                position_part = "→ 🛑 CASH (Bearish Trend)"
        else:
            position_part = f"→ Position: {position_size:.1f}x"

    return " | ".join([trend_part, regime_part, risk_part, position_part])


def get_cached_models() -> Dict[str, Dict]:
    """Summarise every model currently held in the in-memory cache.

    Returns a dict keyed by cached symbol; each value carries the model's
    ``trained_at``, ``n_states``, ``avg_train_vol`` and ``train_days``
    metadata, with defaults for anything missing.
    """
    summary = {}
    for symbol, data in _model_cache.items():
        summary[symbol] = {
            'trained_at': data.get('trained_at', 'Unknown'),
            'n_states': data.get('n_states', 3),
            'avg_train_vol': data.get('avg_train_vol', 0),
            'train_days': data.get('train_days', 0)
        }
    return summary