# Spaces: karimic/ai-code-detector (Sleeping)
# File size: 35,272 Bytes

"""
classifier.py
=============
Trains a Random Forest classifier on the dataset of extracted features,
evaluates it, and saves it to disk for use by the web application.

Running (training):
    python classifier.py

Using it from another file (prediction):
    from classifier import predict
    result = predict(code="def foo(x): return x", language="python")
    print(result["ai_probability"])   # e.g. 0.73
    print(result["verdict"])          # "Vjerojatno AI"
    print(result["top_features"])     # which features mattered most

Note: predict() only scores snippets with at least MINIMUM_LINES non-empty
lines; for shorter input (such as the one-liner above) it returns
ai_probability=None together with an explanatory "error" message.
"""

import os
import csv
import pickle
import warnings
warnings.filterwarnings("ignore")

import numpy as np
from sklearn.ensemble import RandomForestClassifier
from sklearn.model_selection import train_test_split, cross_val_score
from sklearn.metrics import (
    classification_report,
    confusion_matrix,
    roc_auc_score,
    precision_recall_curve,
)
from sklearn.preprocessing import StandardScaler
from sklearn.calibration import CalibratedClassifierCV

from feature_extraction import extract_all_features


# ─────────────────────────────────────────────────────────────────────────────
# CONFIGURATION
# ─────────────────────────────────────────────────────────────────────────────

# Input dataset and the on-disk locations of the pickled training artefacts.
DATASET_PATH  = os.path.join("data", "dataset.csv")
MODEL_DIR     = "model"
MODEL_PATH    = os.path.join(MODEL_DIR, "classifier.pkl")
SCALER_PATH   = os.path.join(MODEL_DIR, "scaler.pkl")
FEATURES_PATH = os.path.join(MODEL_DIR, "feature_names.pkl")

# Columns that are not used as training features
IGNORED_COLUMNS = {"label", "source", "detected_language", "model_available"}

# The perplexity feature is -1.0 when the language model is not loaded —
# that value is treated as "missing"
PERPLEXITY_MISSING = -1.0

# Random Forest parameters
RF_PARAMS = {
    "n_estimators":  300,
    "max_depth":     None,
    "min_samples_leaf": 2,
    # Intent: keep false positives (an innocent student flagged as AI) costly.
    # "balanced" compensates for class imbalance automatically.
    # NOTE(review): the original comments here also described explicit
    # weights {0: 1.0, 1: 0.8} and a 29% human / 71% AI split. Neither matches
    # the "balanced" setting below or the undersampling done in main()
    # (human capped at 3x AI) — confirm which is intended.
    "class_weight": "balanced",
    # max_features is additionally restricted for better generalisation
    "max_features": "sqrt",
    "random_state":  42,
    "n_jobs":       -1,
}

# Below this many non-empty lines a snippet is considered too small for
# reliable analysis
MINIMUM_LINES = 5

# Probability thresholds — more conservative thresholds reduce false positives.
# NOTE(review): predict() in this file derives its verdict bands from the
# stored decision threshold instead; this table appears unused here — confirm.
THRESHOLDS = {
    "likely_ai":    0.80,   # at or above → "Vjerojatno AI"
    "possible_ai":  0.65,   # at or above → "Moguće AI"
    "unclear":      0.45,   # at or above → "Nejasno"
    "possible_human": 0.25, # at or above → "Moguće čovječji"
    # below → "Vjerojatno čovječji"
}


# ─────────────────────────────────────────────────────────────────────────────
# UČITAVANJE DATASETA
# ─────────────────────────────────────────────────────────────────────────────

def ucitaj_dataset(path: str):
    """
    Load dataset.csv and return the feature matrix X and the label vector y.

    A perplexity value equal to PERPLEXITY_MISSING (-1.0, i.e. no language
    model was available) is replaced with 0.0 so the sentinel is not fed to
    the classifier as a negative value.

    A row that cannot be parsed (missing column, short row, non-numeric
    value) is skipped as a whole, so X and y always stay aligned.

    Parameters:
        path (str): Path to the CSV file.

    Returns:
        X (np.ndarray):        float32 feature matrix, shape (n_samples, n_features).
        y (np.ndarray):        int32 label vector (0=human, 1=ai).
        feature_names (list):  Column names matching the columns of X.

    Raises:
        FileNotFoundError: If ``path`` does not exist.
        ValueError: If the file has no data rows, or no row could be parsed.
    """
    if not os.path.exists(path):
        raise FileNotFoundError(
            f"Dataset nije pronađen na '{path}'.\n"
            f"Pokreni prvo: python download_dataset.py"
        )

    # newline="" lets the csv module handle line endings inside quoted fields.
    with open(path, "r", encoding="utf-8", newline="") as f:
        redovi = list(csv.DictReader(f))

    if not redovi:
        raise ValueError("Dataset je prazan.")

    # Feature columns are all columns except the ignored ones. DictReader
    # stores surplus cells under the key None, which is never a feature.
    feature_names = [
        c for c in redovi[0].keys()
        if c is not None and c not in IGNORED_COLUMNS
    ]
    perplexity_idx = (
        feature_names.index("perplexity") if "perplexity" in feature_names else None
    )

    X_rows = []
    y_list = []
    preskoceno = 0

    for row in redovi:
        # Parse the complete row first and append only afterwards: a failure
        # halfway through must not leave a label without a feature vector.
        try:
            label = int(row["label"])
            vrijednosti = [float(row[feat]) for feat in feature_names]
        except (KeyError, TypeError, ValueError):
            preskoceno += 1
            continue   # skip malformed rows

        # Perplexity -1.0 → 0.0 (not available, must not act as a signal)
        if (perplexity_idx is not None
                and vrijednosti[perplexity_idx] == PERPLEXITY_MISSING):
            vrijednosti[perplexity_idx] = 0.0

        X_rows.append(vrijednosti)
        y_list.append(label)

    if not y_list:
        raise ValueError("Dataset ne sadrži nijedan ispravan redak.")

    X = np.array(X_rows, dtype=np.float32)
    y = np.array(y_list, dtype=np.int32)

    print(f"  Učitano {len(y)} primjera, {len(feature_names)} značajki")
    print(f"  Human (0): {int(np.sum(y == 0))}  |  AI (1): {int(np.sum(y == 1))}")
    if preskoceno:
        print(f"  Preskočeno neispravnih redaka: {preskoceno}")

    return X, y, feature_names


# ─────────────────────────────────────────────────────────────────────────────
# TRENIRANJE
# ─────────────────────────────────────────────────────────────────────────────

def treniraj(X, y, feature_names):
    """
    Train a calibrated Random Forest classifier and evaluate it.

    Pipeline:
        1. Split the data 80% train / 20% test (stratified).
        2. Standardise the features (StandardScaler fitted on the train split).
        3. Train a Random Forest wrapped in isotonic probability calibration.
        4. Evaluate on the test split (report, confusion matrix, AUC-ROC).
        5. Derive an AI decision cut-off from the precision/recall curve of
           the human class and pickle it to MODEL_DIR/threshold.pkl.
        6. Run shuffled, stratified 5-fold cross-validation (F1).

    Side effects: prints the evaluation to stdout and writes threshold.pkl.

    Parameters:
        X (np.ndarray):       Feature matrix.
        y (np.ndarray):       Label vector (0=human, 1=ai).
        feature_names (list): Feature names, one per column of X.

    Returns:
        model:   Fitted CalibratedClassifierCV wrapping a RandomForestClassifier.
        scaler:  Fitted StandardScaler.
        metrics: Dict with AUC-ROC, CV F1 mean/std and confusion-matrix counts.
    """
    # 1. Train/test split. stratify=y keeps the class ratio equal in both parts.
    X_train, X_test, y_train, y_test = train_test_split(
        X, y, test_size=0.2, random_state=42, stratify=y
    )
    print(f"\n  Trening: {len(y_train)} primjera")
    print(f"  Test:    {len(y_test)} primjera")

    # 2. Standardisation. The scaler is fitted on the training split ONLY and
    #    then applied to both splits, so no test-set statistics leak in.
    scaler = StandardScaler()
    X_train_scaled = scaler.fit_transform(X_train)
    X_test_scaled  = scaler.transform(X_test)

    # 3. Random Forest + probability calibration. CalibratedClassifierCV
    #    corrects the distorted probabilities a raw forest can produce.
    #    Isotonic calibration is the more flexible method but needs more data
    #    (the original author considered >1000 samples sufficient).
    print("\n  Treniram Random Forest + kalibriram vjerojatnosti...")
    base_model = RandomForestClassifier(**RF_PARAMS)
    model = CalibratedClassifierCV(base_model, method='isotonic', cv=3)
    model.fit(X_train_scaled, y_train)

    # 4. Evaluation on the held-out test split
    y_pred      = model.predict(X_test_scaled)
    y_pred_prob = model.predict_proba(X_test_scaled)[:, 1]   # P(AI)

    print("\n" + "─" * 50)
    print("  REZULTATI EVALUACIJE")
    print("─" * 50)
    print(classification_report(
        y_test, y_pred,
        target_names=["Human (0)", "AI (1)"],
        digits=3
    ))

    # Confusion matrix — shows false positives and false negatives.
    # labels=[0, 1] guarantees a 2x2 matrix so the unpacking below is safe.
    cm = confusion_matrix(y_test, y_pred, labels=[0, 1])
    tn, fp, fn, tp = cm.ravel()
    print(f"  Matrica zabune:")
    print(f"    Ispravno human:      {tn}  (true negative)")
    print(f"    Lažno označen AI:    {fp}  (false positive)")
    print(f"    Propušten AI:        {fn}  (false negative)")
    print(f"    Ispravno AI:         {tp}  (true positive)\n")

    # AUC-ROC — ranking quality (0.5 = random, 1.0 = perfect)
    auc = roc_auc_score(y_test, y_pred_prob)
    print(f"  AUC-ROC: {auc:.4f}")

    # 5. Decision cut-off. Goal: fewer false positives, even at the cost of
    #    missing some AI code. The curve is computed for the human class
    #    (pos_label=0), so the score passed in must be the probability of
    #    that class, i.e. P(human) = 1 - P(AI).
    human_prob = 1.0 - y_pred_prob
    precisions, recalls, thresholds = precision_recall_curve(
        y_test, human_prob, pos_label=0
    )
    # Thresholds are ascending; take the first (lowest) P(human) threshold at
    # which "human" verdicts are right at least 85% of the time while still
    # recovering at least 30% of the human samples.
    optimal_threshold = 0.5  # fallback
    for prec, rec, thr in zip(precisions, recalls, thresholds):
        if prec >= 0.85 and rec >= 0.30:
            optimal_threshold = thr
            break

    # "human" is predicted when P(human) >= thr, i.e. when P(AI) <= 1 - thr.
    ai_cutoff = float(1 - optimal_threshold)
    print(f"\n  Optimalni prag odluke za AI klasu: {ai_cutoff:.2f}")
    print(f"  (Prag ispod kojeg klasificiramo kao Human)")

    # Store the cut-off next to the model
    threshold_path = os.path.join(MODEL_DIR, "threshold.pkl")
    os.makedirs(MODEL_DIR, exist_ok=True)
    with open(threshold_path, "wb") as f_thr:
        pickle.dump(ai_cutoff, f_thr)

    # 6. Cross-validation with shuffling — a more reliable estimate.
    #    StratifiedKFold + shuffle avoids folds that contain only one kind of
    #    data (e.g. a single source dataset).
    from sklearn.model_selection import StratifiedKFold
    print("\n  5-fold cross-validation (može potrajati minutu)...")
    X_scaled_full = scaler.transform(X)
    skf = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
    cv_scores = cross_val_score(
        model, X_scaled_full, y,
        cv=skf, scoring="f1", n_jobs=-1
    )
    print(f"  CV F1 scores: {[f'{s:.3f}' for s in cv_scores]}")
    print(f"  CV F1 prosjek: {cv_scores.mean():.3f} "
          f"(±{cv_scores.std():.3f})")

    # Top 10 most important features. CalibratedClassifierCV wraps the base
    # estimator, so the importances are read from the first calibrated fold.
    try:
        base_rf = model.calibrated_classifiers_[0].estimator
        importances = base_rf.feature_importances_
    except (AttributeError, IndexError):
        # Fallback when the wrapper does not expose the expected structure
        importances = np.zeros(len(feature_names))

    top_idx = np.argsort(importances)[::-1][:10]
    print("\n  Top 10 najvažnijih značajki:")
    for rank, idx in enumerate(top_idx, 1):
        print(f"    {rank:2}. {feature_names[idx]:<38} {importances[idx]:.4f}")

    metrics = {
        "auc_roc":    auc,
        "cv_f1_mean": cv_scores.mean(),
        "cv_f1_std":  cv_scores.std(),
        "true_negative":   int(tn),
        "false_positive":  int(fp),
        "false_negative":  int(fn),
        "true_positive":   int(tp),
    }

    return model, scaler, metrics


# ─────────────────────────────────────────────────────────────────────────────
# SPREMANJE MODELA
# ─────────────────────────────────────────────────────────────────────────────

def spremi_model(model, scaler, feature_names):
    """
    Persist the trained model, the scaler and the feature-name list to disk.

    All three files are needed for prediction:
      - model         : makes the decision
      - scaler        : normalises input the same way as during training
      - feature_names : guarantees features are supplied in the right order

    If MODEL_DIR/threshold.pkl already exists, its value is read back and
    printed together with the saved paths.

    Parameters:
        model:          Trained classifier to pickle.
        scaler:         Fitted scaler to pickle.
        feature_names:  List of feature names.
    """
    os.makedirs(MODEL_DIR, exist_ok=True)
    threshold_file = os.path.join(MODEL_DIR, "threshold.pkl")

    # Write the three artefacts in a fixed order: model, scaler, names.
    artefacts = (
        (MODEL_PATH, model),
        (SCALER_PATH, scaler),
        (FEATURES_PATH, feature_names),
    )
    for target, payload in artefacts:
        with open(target, "wb") as out:
            pickle.dump(payload, out)

    print(f"\n  Model spremljen u:          {MODEL_PATH}")
    print(f"  Scaler spremljen u:         {SCALER_PATH}")
    print(f"  Nazivi značajki spremljeni: {FEATURES_PATH}")

    # The threshold file is optional; report it only when present.
    if not os.path.exists(threshold_file):
        return
    with open(threshold_file, "rb") as src:
        stored = pickle.load(src)
    print(f"  Optimalni prag:             {stored:.2f}")


# ─────────────────────────────────────────────────────────────────────────────
# PREDIKCIJA — koristi se iz web aplikacije
# ─────────────────────────────────────────────────────────────────────────────

def ucitaj_model():
    """
    Load the model, scaler, feature names and decision threshold from disk.

    According to the original note this is meant to be called once when the
    web server starts.

    Returns:
        (model, scaler, feature_names, threshold), or
        (None, None, None, 0.65) when any of the three model files is missing.
        The threshold falls back to 0.65 when threshold.pkl does not exist.
    """
    fallback_threshold = 0.65  # conservative default
    artefact_paths = (MODEL_PATH, SCALER_PATH, FEATURES_PATH)

    # All three artefacts are required; bail out on the first missing one.
    for candidate in artefact_paths:
        if not os.path.exists(candidate):
            return None, None, None, fallback_threshold

    loaded = []
    for candidate in artefact_paths:
        with open(candidate, "rb") as src:
            loaded.append(pickle.load(src))
    model, scaler, feature_names = loaded

    # The threshold file is optional.
    threshold_file = os.path.join(MODEL_DIR, "threshold.pkl")
    threshold = fallback_threshold
    if os.path.exists(threshold_file):
        with open(threshold_file, "rb") as src:
            threshold = pickle.load(src)

    return model, scaler, feature_names, threshold



# ─────────────────────────────────────────────────────────────────────────────
# GENERIRANJE OBJAŠNJENJA
# ─────────────────────────────────────────────────────────────────────────────

def generate_explanations(features: dict, ai_prob: float) -> list:
    """
    Produce English explanations of why code looks AI-generated or human-written.

    Each explanation is a dict with:
      "text"     — the explanation sentence(s)
      "severity" — "high" | "medium" | "low" | "positive"
      "feature"  — name of the feature the explanation refers to
                   ("combined" for the neutral fallback message)

    The numeric cut-offs are heuristics; per the original author they were
    calibrated on typical values in the AI-Detector and HMCorp datasets.

    Parameters:
        features (dict): Feature dictionary from extract_all_features().
            Missing keys default to 0 (perplexity to -1, total_lines to 1).
        ai_prob (float): Probability of AI origin (0.0 – 1.0); only used to
            pick the neutral message when no rule fires.

    Returns:
        list: Explanation dicts ordered high → medium → low → positive; the
        rule order is preserved inside each severity group.
    """
    found = []

    def emit(severity, feature, text):
        found.append({"text": text, "severity": severity, "feature": feature})

    def value(name, default=0):
        return features.get(name, default)

    # ── NAMING ─────────────────────────────────────────────────────────────

    ident_len = value("avg_identifier_length")
    if ident_len > 7.5:
        emit(
            "high", "avg_identifier_length",
            "Identifier names are unusually long and descriptive "
            f"(average {ident_len:.1f} characters). "
            "AI-generated code consistently favours verbose, self-documenting names "
            "such as 'calculate_average_value' over typical student shorthand like 'avg'.",
        )
    elif ident_len > 5.5:
        emit(
            "medium", "avg_identifier_length",
            f"Identifier names are moderately long (average {ident_len:.1f} characters), "
            "which is slightly above the typical range for human-written student code.",
        )
    elif 0 < ident_len < 2.5:
        emit(
            "positive", "avg_identifier_length",
            f"Identifier names are very short (average {ident_len:.1f} characters), "
            "consistent with a human programmer's preference for concise variable names.",
        )

    consistency = value("naming_consistency")
    if consistency > 0.85:
        consistency_pct = consistency * 100
        emit(
            "high", "naming_consistency",
            "Naming convention is highly consistent throughout the submission "
            f"({consistency_pct:.0f}% of identifiers follow the same pattern). "
            "Human programmers typically mix conventions, especially in longer submissions.",
        )
    elif 0 < consistency < 0.3:
        emit(
            "positive", "naming_consistency",
            "Naming convention varies across the submission, which is characteristic "
            "of code written incrementally by a human programmer.",
        )

    single_ratio = value("single_char_name_ratio")
    if single_ratio < 0.03 and value("num_functions") > 1:
        emit(
            "medium", "single_char_name_ratio",
            "No single-character variable names were detected. "
            "Human programmers routinely use short names such as 'i', 'x', or 'n' "
            "in loops and helper functions; their absence is atypical.",
        )
    elif single_ratio > 0.25:
        single_pct = single_ratio * 100
        emit(
            "positive", "single_char_name_ratio",
            "A notable proportion of variables use single-character names "
            f"({single_pct:.0f}%), which is common in human-written code.",
        )

    # ── COMMENTS AND DOCSTRINGS ────────────────────────────────────────────

    comments = value("comment_ratio")
    comments_pct = comments * 100
    if comments > 0.30:
        emit(
            "high", "comment_ratio",
            "Comment density is substantially above average — "
            f"{comments_pct:.0f}% of lines contain inline comments. "
            "AI models tend to annotate nearly every logical step, "
            "whereas students typically comment only non-obvious sections.",
        )
    elif comments > 0.18:
        emit(
            "medium", "comment_ratio",
            f"Comment density ({comments_pct:.0f}% of lines) is higher than "
            "typically observed in student submissions at this level.",
        )
    elif comments < 0.03:
        emit(
            "positive", "comment_ratio",
            "Very few or no inline comments are present, which is more consistent "
            "with human-written code at this stage of the course.",
        )

    docstring_count = value("num_docstrings")
    # The function count is approximated from function_density * total_lines
    # because the structural features are densities, not absolute counts.
    estimated_functions = max(
        1, round(value("function_density") * value("total_lines", 1))
    )

    if docstring_count > 0:
        coverage = docstring_count / max(estimated_functions, 1)
        if docstring_count >= 3 and coverage >= 0.8:
            emit(
                "high", "num_docstrings",
                "Every function in the submission includes a formal docstring "
                f"({docstring_count} docstrings detected). "
                "Complete docstring coverage is a strong marker of AI-generated code; "
                "students rarely document all functions unless explicitly required.",
            )
        elif docstring_count >= 2:
            emit(
                "medium", "num_docstrings",
                f"Multiple functions include docstrings ({docstring_count} detected), "
                "which is above the typical student average.",
            )

    # ── STRUCTURAL FEATURES ────────────────────────────────────────────────

    fn_length = value("avg_function_length")
    if fn_length > 20:
        emit(
            "medium", "avg_function_length",
            f"Functions are notably long on average ({fn_length:.0f} lines per function). "
            "AI models tend to produce complete, self-contained implementations; "
            "students more often break logic across multiple smaller functions "
            "or leave parts incomplete.",
        )
    elif 0 < fn_length < 6:
        emit(
            "positive", "avg_function_length",
            f"Functions are concise on average ({fn_length:.1f} lines), "
            "which is consistent with a human programmer's incremental coding style.",
        )

    if value("try_density") > 0.06:
        emit(
            "medium", "try_density",
            "The submission contains a relatively high density of try/except blocks. "
            "Comprehensive error handling across all edge cases is a pattern "
            "commonly exhibited by AI generators, which anticipate and handle "
            "exceptions that students typically overlook.",
        )

    depth = value("max_nesting_depth")
    if depth > 5:
        emit(
            "medium", "max_nesting_depth",
            f"Code nesting reaches a depth of {int(depth)} levels. "
            "While not conclusive, deeply nested logic can reflect an AI model's "
            "tendency to handle all conditional branches explicitly.",
        )

    # ── STATISTICAL ANALYSIS ───────────────────────────────────────────────

    entropy = value("token_entropy")
    if 0 < entropy < 3.8:
        emit(
            "high", "token_entropy",
            f"Token entropy is low ({entropy:.2f}), indicating that the vocabulary "
            "of the submission is repetitive and predictable. "
            "This is consistent with language model output, which tends to reuse "
            "the same phrasing and structural patterns.",
        )
    elif entropy > 5.5:
        emit(
            "positive", "token_entropy",
            f"Token entropy is relatively high ({entropy:.2f}), suggesting "
            "a diverse and varied vocabulary more typical of human authorship.",
        )

    # Only positive perplexities are interpreted; -1 marks "not available".
    ppl = value("perplexity", -1)
    if 0 < ppl < 8:
        emit(
            "high", "perplexity",
            f"The code's perplexity score is very low ({ppl:.1f}), meaning "
            "a language model finds the token sequence highly predictable. "
            "This strongly suggests the code was generated by a similar model.",
        )
    elif 8 <= ppl < 20:
        emit(
            "medium", "perplexity",
            f"Perplexity ({ppl:.1f}) falls within a range that is "
            "moderately consistent with AI-generated code.",
        )
    elif ppl > 50:
        emit(
            "positive", "perplexity",
            f"Perplexity is high ({ppl:.1f}), indicating the code "
            "contains patterns that a language model would consider unexpected — "
            "a characteristic of human authorship.",
        )

    # ── FORMATTING ─────────────────────────────────────────────────────────

    trailing_ws = value("trailing_whitespace_ratio")
    if trailing_ws > 0.15:
        trailing_pct = trailing_ws * 100
        emit(
            "positive", "trailing_whitespace_ratio",
            "A notable proportion of lines contain trailing whitespace "
            f"({trailing_pct:.0f}%), which is typical of code edited by hand "
            "and inconsistent with AI-generated output.",
        )

    if value("operator_spacing_consistency") > 0.95:
        emit(
            "medium", "operator_spacing_consistency",
            "Spacing around operators is perfectly consistent throughout the submission. "
            "AI models apply style conventions uniformly; human programmers "
            "occasionally deviate, particularly under time pressure.",
        )

    # No rule fired: add one neutral message chosen by the probability.
    if not found:
        if ai_prob > 0.5:
            emit(
                "medium", "combined",
                "No single dominant signal was identified; the classification is based "
                "on a combination of subtle stylistic and structural patterns.",
            )
        else:
            emit(
                "positive", "combined",
                "No strong AI-generation markers were detected. "
                "The submission's style and structure are consistent with human authorship.",
            )

    # Stable ordering: high → medium → low → positive (unknown ranks as "low").
    rank = {"high": 0, "medium": 1, "low": 2, "positive": 3}
    return sorted(found, key=lambda item: rank.get(item["severity"], 2))


def predict(code: str, language: str = None, filename: str = None,
            model=None, scaler=None, feature_names=None, threshold: float = None) -> dict:
    """
    Analyse a code snippet and estimate the probability that it is AI-generated.

    If ``model`` is not passed, the model, scaler, feature names and threshold
    are loaded from disk via ucitaj_model(). An explicitly passed
    ``threshold`` always takes precedence over the loaded/default value.

    Parameters:
        code (str):           Source code to analyse (None is treated as empty).
        language (str):       Programming language (optional, forwarded to
                              extract_all_features).
        filename (str):       File name (optional, forwarded to
                              extract_all_features).
        model:                Loaded model (optional, for repeated use).
        scaler:               Loaded scaler (optional; required with ``model``).
        feature_names (list): Feature names in training order (optional;
                              required with ``model``).
        threshold (float):    AI decision cut-off. Defaults to the value
                              stored on disk, or 0.65 when a model is passed
                              directly.

    Returns:
        dict with keys:
            "ai_probability"    – float 0.0-1.0, or None when no prediction was made
            "verdict"           – string interpreting the result
            "detected_language" – detected programming language
            "top_features"      – list of dicts {"name", "value", "importance"}
                                  for the 5 most important model features
            "all_features"      – dict of all extracted features
            "explanations"      – list from generate_explanations() ([] on error)
            "error"             – error string, or None if everything is OK
    """
    # Load the model when none was passed; never overwrite a threshold the
    # caller supplied explicitly.
    if model is None:
        model, scaler, feature_names, loaded_threshold = ucitaj_model()
        if threshold is None:
            threshold = loaded_threshold
    elif threshold is None:
        threshold = 0.65  # conservative default when the model is passed directly

    if model is None:
        return {
            "ai_probability":     None,
            "verdict":            "Model nije dostupan",
            "detected_language":  None,
            "top_features":       [],
            "all_features":       {},
            "explanations":       [],
            "error": "Model nije treniran. Pokreni: python classifier.py"
        }

    # Minimum-length check — short snippets carry too little signal for a
    # reliable analysis and are prone to false positives.
    code = code or ""
    meaningful_lines = sum(1 for line in code.splitlines() if line.strip())
    if meaningful_lines < MINIMUM_LINES:
        # Croatian plural: 1 → "liniju", 2-4 → "linije", otherwise "linija"
        # (with the usual exceptions for 11-14).
        zadnja, zadnje_dvije = meaningful_lines % 10, meaningful_lines % 100
        if zadnja == 1 and zadnje_dvije != 11:
            oblik = "liniju"
        elif 2 <= zadnja <= 4 and not 12 <= zadnje_dvije <= 14:
            oblik = "linije"
        else:
            oblik = "linija"
        return {
            "ai_probability":    None,
            "verdict":           "Premalo koda za analizu",
            "detected_language": None,
            "top_features":      [],
            "all_features":      {},
            "explanations":      [],
            "error": (
                f"Analiza zahtijeva najmanje {MINIMUM_LINES} nepraznih linija koda. "
                f"Predani isječak ima {meaningful_lines} "
                f"({oblik})."
            )
        }

    # Extract the features
    sve_znacajke = extract_all_features(
        code=code, language=language, filename=filename
    )

    # Build the feature vector in EXACTLY the order used during training.
    # Features the extractor did not return default to 0.0.
    feature_vector = []
    for feat in feature_names:
        val = sve_znacajke.get(feat, 0.0)
        if feat == "perplexity" and val == PERPLEXITY_MISSING:
            val = 0.0   # same missing-value handling as in training
        feature_vector.append(float(val))

    X = np.array([feature_vector], dtype=np.float32)
    X_scaled = scaler.transform(X)

    # Prediction: column 1 is read as P(AI)
    ai_prob = float(model.predict_proba(X_scaled)[0][1])

    # Interpretation — verdict bands are placed relative to the decision
    # cut-off: at or above it leans "AI", below it leans "Human".
    ai_cutoff = threshold
    # The "likely AI" band starts 0.15 above the cut-off, capped at 0.90, but
    # never below the cut-off itself (matters when the cut-off exceeds 0.90).
    strong_cutoff = max(ai_cutoff, min(ai_cutoff + 0.15, 0.90))
    if ai_prob >= strong_cutoff:
        verdict = "Vjerojatno AI"
    elif ai_prob >= ai_cutoff:
        verdict = "Moguće AI"
    elif ai_prob >= ai_cutoff - 0.20:
        verdict = "Nejasno"
    elif ai_prob >= ai_cutoff - 0.40:
        verdict = "Moguće čovječji"
    else:
        verdict = "Vjerojatno čovječji"

    # Top 5 features by model importance. The importances are read from the
    # base estimator inside CalibratedClassifierCV; when the model does not
    # expose that structure, every feature gets the same weight.
    try:
        base_rf = model.calibrated_classifiers_[0].estimator
        importances = base_rf.feature_importances_
    except (AttributeError, IndexError):
        importances = np.ones(len(feature_names)) / len(feature_names)
    top_idx = np.argsort(importances)[::-1][:5]
    top_features = [
        {
            "name":       feature_names[i],
            "value":      round(feature_vector[i], 4),
            "importance": round(float(importances[i]), 4),
        }
        for i in top_idx
    ]

    # Explain why the code was classified this way
    objasnjenja = generate_explanations(sve_znacajke, ai_prob)

    return {
        "ai_probability":    round(ai_prob, 4),
        "verdict":           verdict,
        "detected_language": sve_znacajke.get("detected_language", "nepoznat"),
        "top_features":      top_features,
        "all_features":      sve_znacajke,
        "explanations":      objasnjenja,
        "error":             None,
    }


# ─────────────────────────────────────────────────────────────────────────────
# GLAVNI PROGRAM
# ─────────────────────────────────────────────────────────────────────────────

def main():
    """
    Train the classifier end to end and run a quick prediction smoke test.

    Steps: load the dataset, undersample the human class to at most 3x the
    AI class, train and evaluate (treniraj), save the artefacts
    (spremi_model), then print predictions for two built-in sample snippets.

    Raises:
        ValueError: If the dataset does not contain both classes.
    """
    print("=" * 50)
    print("  Treniranje klasifikatora")
    print("=" * 50)

    # Load the dataset
    print(f"\n  Učitavam dataset iz '{DATASET_PATH}'...")
    X, y, feature_names = ucitaj_dataset(DATASET_PATH)

    # ── UNDERSAMPLING ──────────────────────────────────────────────────────
    # Balance the classes by keeping at most 3x as many human samples as AI
    # samples. Per the original note, with the raw ratio (63:1) the model
    # would almost always predict human.

    n_ai    = int(np.sum(y == 1))
    n_human = int(np.sum(y == 0))
    if n_ai == 0 or n_human == 0:
        # Without both classes the ratio below divides by zero and the
        # training step cannot produce a meaningful model.
        raise ValueError(
            f"Dataset mora sadržavati obje klase (human={n_human}, ai={n_ai})."
        )
    target_human = min(n_human, n_ai * 3)   # at most 3x more human than AI

    if n_human > target_human:
        print(f"\n  Undersampling: {n_human} → {target_human} human primjera")
        print(f"  (zadržavamo svih {n_ai} AI + {target_human} human = "
              f"{n_ai + target_human} ukupno, omjer {target_human//n_ai}:1)")

        rng = np.random.default_rng(42)
        human_idx = np.where(y == 0)[0]
        ai_idx    = np.where(y == 1)[0]

        # Randomly pick target_human samples from the human class
        chosen_human = rng.choice(human_idx, size=target_human, replace=False)

        # Merge with all AI samples and shuffle
        all_idx = np.concatenate([chosen_human, ai_idx])
        rng.shuffle(all_idx)

        X = X[all_idx]
        y = y[all_idx]
        print(f"  Nakon undersamplinga: Human={int(np.sum(y==0))}, "
              f"AI={int(np.sum(y==1))}, Ukupno={len(y)}")
    # ──────────────────────────────────────────────────────────────────────

    # Train
    model, scaler, metrics = treniraj(X, y, feature_names)

    # Save
    spremi_model(model, scaler, feature_names)

    # Quick prediction smoke test
    print("\n" + "─" * 50)
    print("  BRZI TEST PREDIKCIJE")
    print("─" * 50)

    test_kodovi = {
        "AI Python": '''
def calculate_fibonacci(n: int) -> list:
    """
    Generate a Fibonacci sequence up to n terms.

    Args:
        n: The number of terms to generate.

    Returns:
        A list containing the Fibonacci sequence.
    """
    if n <= 0:
        raise ValueError("Number of terms must be positive.")
    fibonacci_sequence = [0, 1]
    for i in range(2, n):
        next_value = fibonacci_sequence[i - 1] + fibonacci_sequence[i - 2]
        fibonacci_sequence.append(next_value)
    return fibonacci_sequence[:n]
''',
        "Human Python": '''
def fib(n):
    # quick fib
    a, b = 0, 1
    res = []
    for _ in range(n):
        res.append(a)
        a, b = b, a+b
    return res
''',
    }

    for naziv, kod in test_kodovi.items():
        rezultat = predict(kod, model=model, scaler=scaler,
                          feature_names=feature_names)
        prob = rezultat["ai_probability"]
        verdict = rezultat["verdict"]
        lang = rezultat["detected_language"]
        print(f"\n  [{naziv}]")
        print(f"    Jezik:           {lang}")
        print(f"    AI vjerojatnost: {prob:.1%}")
        print(f"    Zaključak:       {verdict}")
        print(f"    Ključne značajke:")
        for feat in rezultat["top_features"]:
            print(f"      {feat['name']:<35} vrijednost={feat['value']:.4f}")

    print("\n" + "=" * 50)
    print("  Treniranje završeno.")
    print("  Sljedeći korak: python app.py")
    print("=" * 50)


if __name__ == "__main__":
    main()