File size: 9,702 Bytes

"""
Key Rank Evaluation
===================
Computes the key rank metric used to evaluate side-channel attack models.
Matches the methodology from the official ASCAD evaluation scripts.

The key rank measures how many key candidates score higher than the correct
key when accumulating log-likelihood scores over increasing numbers of
attack traces. A rank of 0 means the correct key is the top candidate.
"""

import logging
from typing import Dict, Optional, Tuple

import numpy as np
import tensorflow as tf

from .constants import AES_SBOX

logger = logging.getLogger(__name__)


def bits_to_byte_probs(bit_predictions: np.ndarray) -> np.ndarray:
    """
    Expand per-bit probabilities into a distribution over all 256 byte values.

    Multi-bit models (Wu et al., TCHES 2024) emit one probability per bit of
    the target byte. Treating the bits as independent, the probability of a
    byte value v is the product over the 8 bit positions of the probability
    that the model assigns to v's bit at that position:

        P(v) = prod_j ( p_j if bit_j(v) == 1 else 1 - p_j )

    Bit positions follow ``np.unpackbits`` ordering, i.e. column 0 of the
    input is the most-significant bit.

    Args:
        bit_predictions: Model output, shape (N, 8), values in [0, 1], where
            column j is P(bit j == 1).

    Returns:
        Byte probabilities, shape (N, 256), float64, each row normalised to
        sum to 1.
    """
    num_rows = bit_predictions.shape[0]

    # bit_table[v, j] is the j-th bit (MSB first) of byte value v -> (256, 8)
    all_bytes = np.arange(256, dtype=np.uint8)
    bit_table = np.unpackbits(all_bytes[:, np.newaxis], axis=1)

    joint = np.ones((num_rows, 256), dtype=np.float64)
    for bit_idx in range(8):
        # Probability that this bit is 1, kept as a column for broadcasting.
        p_one = bit_predictions[:, bit_idx:bit_idx + 1].astype(np.float64)
        bit_is_set = bit_table[:, bit_idx].astype(bool)  # (256,)
        # Pick p_one where the byte value has the bit set, 1 - p_one otherwise.
        joint *= np.where(bit_is_set[np.newaxis, :], p_one, 1.0 - p_one)

    # The product already sums to 1 analytically; renormalise to absorb
    # rounding error, with a floor so an all-zero row cannot divide by zero.
    totals = np.maximum(joint.sum(axis=1, keepdims=True), 1e-300)
    return joint / totals


def compute_key_rank(
    predictions: np.ndarray,
    metadata: np.ndarray,
    real_key: int,
    target_byte: int,
    num_traces: Optional[int] = None,
    rank_step: int = 10,
) -> Tuple[np.ndarray, int]:
    """
    Compute the key rank over an increasing number of attack traces.

    For each key candidate k in [0..255], the log-likelihood score is:
        score[k] = sum_i log( predictions[i][ Sbox(plaintext_i XOR k) ] )

    The rank of the real key is its position when candidates are sorted
    by descending score.

    Non-positive (or NaN) probabilities cannot be logged. For those entries
    the back-off term ``log(m ** 2)`` is used instead, where m is the
    smallest strictly positive probability in the same trace. It is
    evaluated as ``2 * log(m)`` so that a tiny m cannot underflow to zero
    and produce ``-inf``. A trace with no positive probability at all
    contributes nothing to any score.

    Args:
        predictions: Model output probabilities, shape (N, 256).
        metadata: Structured array with 'plaintext' and 'key' fields; only
            ``metadata[i]["plaintext"][target_byte]`` is read here.
        real_key: The true key byte value (0-255).
        target_byte: Index of the target byte (0-15).
        num_traces: Number of attack traces to use (default: all). Values
            larger than ``len(predictions)`` are clamped.
        rank_step: Step size for computing intermediate ranks.

    Returns:
        Tuple of (ranks_array, final_rank).
        ranks_array: shape (M, 2), dtype uint32, with columns
            [num_traces, rank]; one row per multiple of ``rank_step``.
        final_rank: The key rank after all ``num_traces`` traces (this
            point is only present in ranks_array when ``num_traces`` is a
            multiple of ``rank_step``).

    Raises:
        ValueError: If ``rank_step`` is not a positive integer.
    """
    if rank_step <= 0:
        raise ValueError(f"rank_step must be a positive integer, got {rank_step}")

    predictions = np.asarray(predictions)
    if num_traces is None:
        num_traces = len(predictions)
    num_traces = min(num_traces, len(predictions))

    # Loop invariants: the S-box as an index array and every key candidate.
    sbox = np.fromiter(AES_SBOX, dtype=np.intp)
    candidates = np.arange(256, dtype=np.intp)

    log_scores = np.zeros(256, dtype=np.float64)
    ranks_list = []

    for i in range(num_traces):
        plaintext_byte = int(metadata[i]["plaintext"][target_byte])

        # Take logs in float64 regardless of the model's output dtype.
        row = predictions[i].astype(np.float64)
        # probs[k] = probability assigned to Sbox(plaintext XOR k).
        probs = row[sbox[plaintext_byte ^ candidates]]
        usable = probs > 0

        if usable.all():
            log_scores += np.log(probs)
        else:
            positive = row[row > 0]
            if positive.size > 0:
                # log(min ** 2) written as 2 * log(min) to avoid underflow.
                backoff = 2.0 * np.log(positive.min())
                # Substitute 1.0 before the log so unusable entries do not
                # trigger warnings; they are replaced by the back-off anyway.
                safe_probs = np.where(usable, probs, 1.0)
                log_scores += np.where(usable, np.log(safe_probs), backoff)
            # No positive probability in this trace: scores stay unchanged.

        if (i + 1) % rank_step == 0:
            ranks_list.append([i + 1, _rank_of_key(log_scores, real_key)])

    if ranks_list:
        ranks_array = np.array(ranks_list, dtype=np.uint32)
    else:
        ranks_array = np.empty((0, 2), dtype=np.uint32)
    final_rank = _rank_of_key(log_scores, real_key)

    return ranks_array, final_rank


def _rank_of_key(log_scores: np.ndarray, real_key: int) -> int:
    """Compute the rank of the real key in the sorted score list."""
    sorted_scores = np.sort(log_scores)[::-1]
    real_score = log_scores[real_key]
    rank = int(np.where(sorted_scores == real_score)[0][0])
    return rank


def _get_rank_at_n(ranks_array: np.ndarray, n: int) -> int:
    """Get the rank at exactly n traces, or the closest available."""
    if len(ranks_array) == 0:
        return 256
    idx = np.where(ranks_array[:, 0] == n)[0]
    if len(idx) > 0:
        return int(ranks_array[idx[0], 1])
    before = ranks_array[ranks_array[:, 0] <= n]
    if len(before) > 0:
        return int(before[-1, 1])
    return int(ranks_array[0, 1])


def evaluate_model(
    model: tf.keras.Model,
    attack_traces: np.ndarray,
    attack_metadata: np.ndarray,
    target_byte: int,
    real_key: int,
    model_type: str = "mlp",
    num_traces: int = 2000,
    rank_step: int = 10,
    output_index: Optional[int] = None,
    cached_predictions: Optional[Dict] = None,
) -> Dict:
    """
    Evaluate a trained model on attack traces and summarise its key rank.

    The function obtains predictions (from ``cached_predictions`` if given,
    otherwise from ``model.predict`` on the first ``num_traces`` traces),
    selects the output for the requested byte, converts 8-column multi-bit
    outputs to 256-class probabilities, and runs ``compute_key_rank``.

    Args:
        model: Trained Keras model. Not used when cached_predictions is set.
        attack_traces: Raw attack traces, shape (N, trace_length).
        attack_metadata: Structured metadata array.
        target_byte: Target key byte index (0-15).
        real_key: True key byte value (0-255).
        model_type: 'mlp', 'cnn', or 'mtan'. For 'cnn' and 'mtan' a trailing
            channel dimension is appended to the traces before prediction.
        num_traces: Number of attack traces to evaluate.
        rank_step: Step size for intermediate rank computation.
        output_index: For multi-output models (MTAN), the index of the
            output to evaluate. With dict outputs the key
            ``f"byte_{output_index}"`` is tried first, then the position in
            the dict's values. If None, the raw prediction is used as-is.
        cached_predictions: Optional pre-computed result of a single
            model.predict() call. When provided, the forward pass is
            skipped, which avoids repeating it for every byte of a
            multi-output model.

    Returns:
        Dictionary with evaluation results:
            'final_rank', 'ranks', 'pre_rank', 'min_rank', 'max_rank',
            'rank_at_500', 'rank_at_1000'.
        'pre_rank' is the rank at the first recorded step; the min/max/pre
        values are 256 when no intermediate rank was recorded.

    Raises:
        ValueError: If the selected predictions are not of shape (N, 256)
            after the optional (N, 8) conversion.
    """
    # --- 1. Obtain raw model output -------------------------------------
    if cached_predictions is None:
        model_input = attack_traces[:num_traces].copy()
        if model_type in ("cnn", "mtan"):
            # Convolutional inputs need an explicit channel axis.
            n_rows, n_samples = model_input.shape[0], model_input.shape[1]
            model_input = model_input.reshape((n_rows, n_samples, 1))
        raw_predictions = model.predict(model_input, batch_size=256, verbose=0)
    else:
        raw_predictions = cached_predictions

    # --- 2. Select the output belonging to the requested task ------------
    # Keras yields a dict for named outputs (e.g. 'byte_0', 'byte_1', ...)
    # and may yield a list for unnamed multi-output models. Anything else,
    # or output_index=None, is used unchanged.
    predictions = raw_predictions
    if output_index is not None:
        if isinstance(raw_predictions, dict):
            output_name = f"byte_{output_index}"
            if output_name in raw_predictions:
                predictions = raw_predictions[output_name]
            else:
                # Name not present: fall back to positional lookup.
                predictions = list(raw_predictions.values())[output_index]
        elif isinstance(raw_predictions, (list, tuple)):
            predictions = raw_predictions[output_index]

    if not isinstance(predictions, np.ndarray):
        predictions = np.array(predictions)

    # --- 3. Normalise to an (N, 256) probability matrix -------------------
    if predictions.ndim == 2 and predictions.shape[1] == 8:
        logger.info(
            "Multi-bit predictions detected (shape %s), converting to byte probs",
            predictions.shape,
        )
        predictions = bits_to_byte_probs(predictions)

    if not (predictions.ndim == 2 and predictions.shape[1] == 256):
        raise ValueError(
            f"Expected predictions shape (N, 256) or (N, 8), got {predictions.shape}. "
            f"raw_predictions type={type(raw_predictions).__name__}, "
            f"output_index={output_index}"
        )

    # --- 4. Key rank over the attack traces -------------------------------
    ranks_array, final_rank = compute_key_rank(
        predictions=predictions,
        metadata=attack_metadata[:num_traces],
        real_key=real_key,
        target_byte=target_byte,
        num_traces=num_traces,
        rank_step=rank_step,
    )

    # --- 5. Summary statistics --------------------------------------------
    if len(ranks_array) > 0:
        recorded_ranks = ranks_array[:, 1]
        min_rank = int(np.min(recorded_ranks))
        max_rank = int(np.max(recorded_ranks))
        pre_rank = int(ranks_array[0, 1])
    else:
        # No intermediate rank was recorded; use the out-of-range sentinel.
        min_rank = max_rank = pre_rank = 256
    rank_at_500 = _get_rank_at_n(ranks_array, 500)
    rank_at_1000 = _get_rank_at_n(ranks_array, 1000)

    logger.info(
        "Byte %d: pre_rank=%d, final_rank=%d, min_rank=%d, max_rank=%d, "
        "rank@500=%d, rank@1000=%d",
        target_byte, pre_rank, final_rank, min_rank, max_rank,
        rank_at_500, rank_at_1000,
    )
    return {
        "final_rank": final_rank,
        "ranks": ranks_array,
        "pre_rank": pre_rank,
        "min_rank": min_rank,
        "max_rank": max_rank,
        "rank_at_500": rank_at_500,
        "rank_at_1000": rank_at_1000,
    }