import json
import os
import pickle
import pandas as pd

# ═════════════════════════════════════════════════════════════════════════════
# CONFIGURATION
# ═════════════════════════════════════════════════════════════════════════════
MODEL_PATH = 'risk_model_v10_extended.pkl'  # pickled artifact exported by the training notebook
DATA_DIR   = '../data/Stocks'               # local per-ticker files: Date,Open,High,Low,Close,Volume,OpenInt
FORECAST_PERIODS = 90                       # business days to forecast ahead (freq='B' below)

# ═════════════════════════════════════════════════════════════════════════════
# 1. CORE PIPELINE FUNCTIONS (Required for Frontend/Backend to use the model)
# ═════════════════════════════════════════════════════════════════════════════
def load_ticker_data(ticker, data_dir=None):
    """

    Load a single ticker from the local dataset.

    File format: Date,Open,High,Low,Close,Volume,OpenInt

    Returns a DataFrame with DatetimeIndex, columns [Close, Volume].

    """
    if data_dir is None:
        data_dir = DATA_DIR

    print(f"[Data] Fetching local dataset data for {ticker.upper()}...")
    
    candidates = [
        os.path.join(data_dir, f'{ticker}.us.txt'),
        os.path.join(data_dir, f'{ticker}.txt'),
        os.path.join(data_dir, f'{ticker.upper()}.us.txt'),
        os.path.join(data_dir, f'{ticker.upper()}.txt'),
    ]

    path = None
    for c in candidates:
        if os.path.isfile(c):
            path = c
            break

    if path is None:
        raise FileNotFoundError(f"Data file for {ticker} not found in {data_dir}. Please provide the dataset.")

    df = pd.read_csv(
        path,
        header=0,
        names=['Date', 'Open', 'High', 'Low', 'Close', 'Volume', 'OpenInt'],
        parse_dates=['Date'],
    )
    df = df[['Date', 'Close', 'Volume']].copy()
    # 'Date' is already parsed by read_csv (parse_dates), so it can be set as the index directly
    df.set_index('Date', inplace=True)
    df.sort_index(inplace=True)

    # Drop duplicates on date index
    df = df[~df.index.duplicated(keep='first')]

    # Only keep rows where Close > 0
    df = df[df['Close'] > 0]
    
    # We keep the DatetimeIndex so we can align with Prophet forecasts
    # Normalize the index to remove time components
    if df.index.tz is not None:
        df.index = df.index.tz_localize(None)
    df.index = df.index.normalize()
    df.index.name = 'Date'
        
    return df

def build_risk_score(df: pd.DataFrame) -> pd.DataFrame:
    """Feature engineering logic (must perfectly match the training phase)."""
    fe = df.copy()
    fe['returns']    = fe['Close'].pct_change()
    fe['vol_14']     = fe['returns'].rolling(14).std()
    fe['momentum']   = fe['Close'] / fe['Close'].rolling(14).mean()
    fe['drawdown']   = fe['Close'] / fe['Close'].cummax()
    fe['returns_5d'] = fe['returns'].rolling(5).mean()
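    # Raw risk combines recent negative returns, 14-day volatility (weighted x2) and drawdown depth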
    fe['risk_raw'] = -fe['returns_5d'] + fe['vol_14'] * 2 + (1 - fe['drawdown'])
    fe.dropna(inplace=True)
    return fe[['Close', 'Volume', 'returns', 'vol_14', 'momentum', 'drawdown', 'returns_5d', 'risk_raw']]
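
# Illustrative usage of the two pipeline functions above (not executed here;
# the ticker symbol is a placeholder and paths follow the configuration section):
#
#   df = load_ticker_data('aapl')              # price history indexed by Date
#   fe = build_risk_score(df)                  # adds returns, vol_14, ..., risk_raw
#   latest_raw_risk = fe['risk_raw'].iloc[-1]  # value that gets normalised at inference time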

# ═════════════════════════════════════════════════════════════════════════════
# 2. INFERENCE SCRIPT
# ═════════════════════════════════════════════════════════════════════════════
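# Expected layout of the pickled artifact, inferred from the lookups below
# (the training-side export may contain additional keys):
#
#   {
#       'version':     str,
#       'export_date': str,
#       'models': {
#           '<TICKER>': {
#               'model':     <fitted Prophet model>,
#               'r_min':     float,  # min of risk_raw seen during training
#               'r_max':     float,  # max of risk_raw seen during training
#               'threshold': float,  # normalised danger threshold
#           },
#           ...
#       },
#   }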
def run_inference():
    if not os.path.exists(MODEL_PATH):
        print(f"[!] Could not find {MODEL_PATH}!")
        print("Please run the final cell in your Jupyter Notebook first to generate this file.")
        return

    print(f"[+] Loading model artifact: {MODEL_PATH}")
    with open(MODEL_PATH, 'rb') as f:
        artifact = pickle.load(f)
    
    print(f"Artifact Version: {artifact['version']} (Exported: {artifact['export_date']})")
    tickers = list(artifact['models'].keys())
    print(f"Models available for {len(tickers)} companies: {tickers}\n")

    frontend_data = {}

    for ticker in tickers:
        print(f"[*] Analyzing {ticker}...")
        try:
            # 1. Load & Engineer Data
            df = load_ticker_data(ticker.lower(), DATA_DIR)
            fe = build_risk_score(df)
            
            # 2. Retrieve the specific model & scaler bounds from the artifact
            ticker_payload = artifact['models'][ticker]
            model     = ticker_payload['model']
            r_min     = ticker_payload['r_min']
            r_max     = ticker_payload['r_max']
            threshold = ticker_payload['threshold']
            
            # 3. Normalise with the min/max bounds saved at training time
            #    (the small epsilon guards against r_max == r_min)
            def norm_apply(value):
                return (value - r_min) / (r_max - r_min + 1e-9)
            
            current_risk_raw = fe['risk_raw'].iloc[-1]
            current_risk_norm = norm_apply(current_risk_raw)
            
            # 4. Forecast using loaded Prophet model
            future = model.make_future_dataframe(periods=FORECAST_PERIODS, freq='B')
            forecast = model.predict(future)
            
            # 5. Detect Breach
            last_date = fe.index[-1]
            future_fc = forecast[forecast['ds'] > pd.Timestamp(last_date)]
            
            breach_detected = False
            days_to_breach = None
            confidence = "NONE"
            
            for conf, col in [('HIGH', 'yhat_lower'), ('MEDIUM', 'yhat'), ('LOW', 'yhat_upper')]:
                rows = future_fc[future_fc[col] > threshold]
                if not rows.empty:
                    breach_detected = True
                    confidence = conf
                    days_to_breach = max((rows.iloc[0]['ds'] - pd.Timestamp(last_date)).days, 0)
                    break
            
            # 6. Package cleanly for the frontend
            frontend_data[ticker] = {
                "last_update_date": str(last_date.date()),
                "current_price": round(fe['Close'].iloc[-1], 2),
                "risk_metrics": {
                    "current_score": round(current_risk_norm, 4),
                    "danger_threshold": round(threshold, 4),
                    "is_in_danger_zone": bool(current_risk_norm > threshold)
                },
                "forecast": {
                    "breach_predicted": breach_detected,
                    "estimated_days_to_breach": days_to_breach,
                    "confidence_level": confidence
                }
            }
            print(f"   [OK] Done. Score: {round(current_risk_norm, 4)} | Breach: {'YES' if breach_detected else 'NO'}")
            
        except Exception as e:
            print(f"   [ERROR] Failed to process {ticker}: {e}")

    # ═════════════════════════════════════════════════════════════════════════════
    # 3. MOCK FRONTEND API RESPONSE
    # ═════════════════════════════════════════════════════════════════════════════
    print("\n" + "="*80)
    print("[*] FRONTEND JSON PAYLOAD GENERATED")
    print("="*80)
    print(json.dumps(frontend_data, indent=2))
    
    # Save to a JSON file for the frontend devs to view
    with open('frontend_mock_api.json', 'w') as f:
        json.dump(frontend_data, f, indent=2)
    print("\n[OK] Saved full response to 'frontend_mock_api.json'")

if __name__ == "__main__":
    run_inference()