Spaces:

CognitiveEngineering
/

ai-model-xray

Sleeping

App Files Files Community

ai-model-xray / analysis.py

CognitiveEngineering

Deploy AI Model X-Ray - structural health scanner

451cf40 verified 19 days ago

Raw

History Blame Contribute Delete

19.8 kB

	"""Structural-health backend for AI Model X-Ray.

	Extracts attention-head connectivity graphs from any HuggingFace transformer and
	computes the spectral simplicial hierarchy per layer:

	lambda2(T(G)) <= lambda2(G) (and the chain lambda2(T3) <= lambda2(T(G)) <= lambda2(G))

	The graph / hierarchy / fragility math is ported verbatim from the validated
	Modal experiments (`modal_jepa.py`, `modal_cross_arch.py`): lambda2 (algebraic
	connectivity), triangle_graph T(G), the fragility index FI (fraction of edges in
	zero triangles) and the per-layer `hierarchy` record. Only the surrounding
	plumbing — model-type detection, per-layer regime classification, the precomputed
	reference cache and the `scan_model` entry point — is new here.

	Each layer is classified into a pruning regime from its coherence ratio
	rho = lambda2(T(G)) / lambda2(G) and its FI:

	    immune    rho > 0.8 and FI == 0   triangle-redundant  -> safe to prune
	    buffer    0.5 <= rho <= 0.8       partial redundancy  -> prune with caution
	    critical  rho < 0.5               low redundancy      -> do not prune
	    (layers where G or T(G) is disconnected have rho undefined -> treated as
	    buffer; layers with rho > 0.8 but FI > 0 also fall back to buffer)
	"""
	from __future__ import annotations

	import json
	import os
	import statistics

	# --------------------------------------------------------------------------- #
	# Constants
	# --------------------------------------------------------------------------- #
	# Numerical tolerance for eigenvalue comparisons and the "FI is zero" test.
	TOL = 1e-9
	# Pearson-r edge threshold (matches the reference runs).
	THRESHOLD = 0.3
	# Structural-integrity gauge slope: score = 100 - FI * SCALING_FACTOR.
	SCALING_FACTOR = 500.0

	# Directory containing this module, and the precomputed reference cache in it.
	HERE = os.path.dirname(os.path.abspath(__file__))
	CACHE_PATH = os.path.join(HERE, "data", "cross_architecture_spectral.json")

	# Probe corpus for text models: 16 diverse English sentences, copied verbatim
	# from modal_cross_arch so live scans stay comparable with the reference runs.
	SENTENCES = [
	    "The quick brown fox jumps over the lazy dog near the river.",
	    "Scientists discovered a new species of butterfly in the rainforest.",
	    "She carefully placed the fragile vase on the wooden shelf.",
	    "Global markets rallied after the central bank cut interest rates.",
	    "He learned to play the violin when he was only six years old.",
	    "The ancient castle stood silently on the hill above the village.",
	    "Machine learning models require large amounts of training data.",
	    "A gentle breeze carried the scent of blossoms across the garden.",
	    "The committee voted unanimously to approve the new budget proposal.",
	    "Children laughed and played in the park on a sunny afternoon.",
	    "The spacecraft entered orbit after a seven month journey to Mars.",
	    "Fresh bread and strong coffee filled the small bakery with warmth.",
	    "Engineers tested the bridge under heavy load before opening it.",
	    "The novel explores themes of memory, loss, and the passage of time.",
	    "Volunteers planted hundreds of trees along the eroding coastline.",
	    "Quantum computers may one day solve problems classical machines cannot.",
	]

	# Models offered in the dropdown, keyed by HuggingFace id. `cache_key` names the
	# model's block in the precomputed cache; None means no precomputed block.
	PRELOADED = {
	    "bert-base-uncased": {
	        "label": "BERT",
	        "type": "Encoder",
	        "params": "110M",
	        "cache_key": "BERT",
	    },
	    "gpt2": {
	        "label": "GPT-2",
	        "type": "Decoder",
	        "params": "124M",
	        "cache_key": "GPT-2",
	    },
	    "google/vit-base-patch16-224": {
	        "label": "ViT",
	        "type": "Vision",
	        "params": "86M",
	        "cache_key": "ViT",
	    },
	    "distilbert-base-uncased": {
	        "label": "DistilBERT",
	        "type": "Encoder",
	        "params": "66M",
	        "cache_key": None,
	    },
	}


	# ========================================================================= #
	# Graph / hierarchy helpers (ported verbatim from modal_jepa.py)
	# ========================================================================= #
	def lambda2(G):
	    """Algebraic connectivity of G: its second-smallest Laplacian eigenvalue.

	    Returns a ``(value, connected, n)`` triple where ``connected`` is
	    networkx's connectivity verdict for G and ``n`` is its node count.
	    Graphs with fewer than two nodes yield ``(None, False, n)``.
	    Mathematically the value is 0 exactly when G is disconnected.

	    Graphs of up to 1800 nodes are solved with a dense eigendecomposition;
	    larger ones ask a sparse solver for two eigenvalues only."""
	    import networkx as nx
	    import numpy as np

	    n = G.number_of_nodes()
	    if n < 2:
	        return None, False, n

	    connected = nx.is_connected(G)
	    laplacian = nx.laplacian_matrix(G)

	    if n > 1800:
	        from scipy.sparse.linalg import eigsh
	        sparse_lap = laplacian.astype(float)
	        try:
	            # Shift-invert just above zero to target the smallest eigenvalues.
	            pair = eigsh(sparse_lap, k=2, sigma=1e-8, which="LM",
	                         return_eigenvectors=False)
	        except Exception:
	            # Fall back to the direct smallest-magnitude search.
	            pair = eigsh(sparse_lap, k=2, which="SM", return_eigenvectors=False)
	        return float(np.sort(pair)[1]), connected, n

	    spectrum = np.linalg.eigvalsh(laplacian.toarray().astype(float))
	    return float(spectrum[1]), connected, n


	def _triangles(G, adj):
	seen = set()
	for v in G.nodes():
	nbrs = sorted(adj[v])
	for x in range(len(nbrs)):
	for y in range(x + 1, len(nbrs)):
	a, b = nbrs[x], nbrs[y]
	if b in adj[a]:
	tri = tuple(sorted((v, a, b)))
	if tri not in seen:
	seen.add(tri)
	yield tri


	def triangle_graph(G):
	    """Build T(G), the triangle graph of G.

	    T(G) has one node per edge of G (numbered in ``G.edges()`` order); two
	    nodes are joined iff the corresponding edges of G share a triangle.
	    Constructed by enumerating the triangles of G and linking the three
	    edges of each one pairwise."""
	    import networkx as nx

	    edge_keys = [tuple(sorted(e)) for e in G.edges()]
	    position = {key: n for n, key in enumerate(edge_keys)}

	    T = nx.Graph()
	    T.add_nodes_from(range(len(edge_keys)))

	    neighbours = {v: set(G.neighbors(v)) for v in G.nodes()}
	    for a, b, c in _triangles(G, neighbours):
	        i = position[tuple(sorted((a, b)))]
	        j = position[tuple(sorted((a, c)))]
	        k = position[tuple(sorted((b, c)))]
	        T.add_edges_from(((i, j), (i, k), (j, k)))
	    return T


	def compute_fi_from_adj(A):
	    """SAL fragility index: fraction of edges that lie in zero triangles.

	    A: n x n binary symmetric adjacency matrix without self-loops (any
	    numeric or boolean dtype). Only the upper triangle is scanned for
	    edges. High FI = fragile.

	    Returns 0.0 when there are fewer than two nodes, 1.0 when the graph has
	    no edges, otherwise ``fragile_edges / total_edges`` as a float.

	    Common-neighbour counts are accumulated in int64. The adjacency built
	    by ``graph_from_corr`` is int8, and an int8 dot product wraps around:
	    an edge with exactly 256 common neighbours would read as 0 and be
	    miscounted as fragile."""
	    import numpy as np

	    n = A.shape[0]
	    if n < 2:
	        return 0.0

	    present = np.asarray(A) != 0
	    wide = present.astype(np.int64)
	    # common[i, j] = number of nodes adjacent to both i and j.
	    common = wide @ wide.T

	    upper = np.triu(present, k=1)  # each undirected edge counted once
	    total = int(np.count_nonzero(upper))
	    if total == 0:
	        return 1.0
	    fragile = int(np.count_nonzero(upper & (common == 0)))
	    return fragile / total


	def graph_from_corr(C, threshold):
	    """Threshold a correlation matrix into a simple undirected graph.

	    Nodes i and j are joined iff ``C[i, j] > threshold``; the diagonal is
	    cleared so there are no self-loops. Returns ``(G, A)``: the networkx
	    graph and the int8 adjacency matrix it was built from."""
	    import networkx as nx
	    import numpy as np

	    adjacency = (C > threshold).astype(np.int8)
	    np.fill_diagonal(adjacency, 0)
	    graph = nx.from_numpy_array(adjacency)
	    return graph, adjacency


	def _density(G):
	n = G.number_of_nodes()
	if n < 2:
	return 0.0
	return 2.0 * G.number_of_edges() / (n * (n - 1))


	def _count_edges_triangles_capped(G, cap):
	    """Count the triangles of G, giving up as soon as the count exceeds *cap*.

	    Returns the exact triangle count when it is at most ``cap``, otherwise
	    ``cap + 1`` (enumeration stops at the first triangle over the cap)."""
	    neighbours = {v: set(G.neighbors(v)) for v in G.nodes()}
	    found = 0
	    for found, _ in enumerate(_triangles(G, neighbours), start=1):
	        if found > cap:
	            break
	    return found


	def hierarchy(C, threshold, edge_cap=400, giant=False):
	    """Per-layer spectral-hierarchy record for a correlation matrix C.

	    The graph G has an edge wherever ``C[i, j] > t``. Starting from
	    ``t = threshold``, t is raised in steps of 0.02 while G has more than
	    ``edge_cap`` edges or more than 4000 triangles, and stops rising once t
	    reaches 0.95, so T(G) stays tractable. The threshold actually used is
	    reported.

	    ``giant=True`` evaluates lambda2 / T(G) on G's largest connected
	    component. ``fi``, ``n_components``, ``orig_nodes`` and ``orig_edges``
	    always describe the full thresholded graph.

	    Returns a dict with keys: threshold, threshold_bumped, giant,
	    orig_nodes, orig_edges, n_components, nodes, edges, density,
	    G_connected, TG_nodes, TG_edges, TG_connected, eligible, l2G, l2TG, rho,
	    fi, violation. ``rho`` (= l2TG / l2G) and ``violation`` (l2TG exceeds
	    l2G by more than TOL) are defined ONLY where both G and T(G) are
	    connected (``eligible``); ``rho`` is None otherwise."""
	    import networkx as nx

	    tri_cap = 4000
	    t = threshold
	    bumped = False
	    while True:
	        G, A = graph_from_corr(C, t)
	        if t >= 0.95:
	            # The threshold may not rise further; skip the density probes.
	            break
	        # Check the cheap edge count first: the triangle enumeration only
	        # runs when the edge cap alone does not already force a bump.
	        too_dense = (G.number_of_edges() > edge_cap
	                     or _count_edges_triangles_capped(G, tri_cap) > tri_cap)
	        if not too_dense:
	            break
	        t = round(t + 0.02, 4)
	        bumped = True

	    # Full-graph statistics, taken before any restriction to the giant component.
	    fi = compute_fi_from_adj(A)
	    n_comp = nx.number_connected_components(G) if G.number_of_nodes() else 0
	    orig_nodes, orig_edges = G.number_of_nodes(), G.number_of_edges()
	    if giant and orig_nodes >= 1 and not nx.is_connected(G):
	        G = G.subgraph(max(nx.connected_components(G), key=len)).copy()

	    l2G, gconn, _ = lambda2(G)
	    TG = triangle_graph(G)
	    tconn = TG.number_of_nodes() >= 2 and nx.is_connected(TG)
	    l2TG, _, _ = lambda2(TG)
	    eligible = bool(gconn and tconn)

	    # rho additionally requires l2G to be safely non-zero before dividing.
	    rho = (l2TG / l2G) if (eligible and l2G and l2G > TOL) else None
	    violation = bool(eligible and l2TG is not None and l2G is not None
	                     and l2TG - l2G > TOL)
	    return {
	        "threshold": t, "threshold_bumped": bumped, "giant": giant,
	        "orig_nodes": int(orig_nodes), "orig_edges": int(orig_edges),
	        "n_components": int(n_comp),
	        "nodes": int(G.number_of_nodes()), "edges": int(G.number_of_edges()),
	        "density": _density(G),
	        "G_connected": bool(gconn),
	        "TG_nodes": int(TG.number_of_nodes()), "TG_edges": int(TG.number_of_edges()),
	        "TG_connected": bool(tconn),
	        "eligible": eligible,
	        "l2G": l2G, "l2TG": l2TG,
	        "rho": rho,
	        "fi": fi,
	        "violation": violation,
	    }


	# ========================================================================= #
	# Regime classification
	# ========================================================================= #
	def classify_regime(rec):
	    """Map a per-layer hierarchy record to its pruning regime.

	    Returns 'immune', 'buffer' or 'critical':

	    * 'immune'   -- rho > 0.8 and FI is zero (within TOL)
	    * 'critical' -- rho < 0.5
	    * 'buffer'   -- everything else, including records whose rho is None
	      (rho undefined); these are treated as partial structure, prune
	      with caution.

	    A missing or None ``fi`` counts as 0.0."""
	    rho = rec.get("rho")
	    if rho is None:
	        return "buffer"

	    fi = rec.get("fi") or 0.0
	    if rho > 0.8 and fi <= TOL:
	        return "immune"
	    return "critical" if rho < 0.5 else "buffer"


	# Display metadata per pruning regime: UI label, hex colour and short advice.
	REGIME_META = {
	    "immune": {
	        "label": "Immune",
	        "color": "#10B981",
	        "advice": "safe to prune",
	    },
	    "buffer": {
	        "label": "Buffer",
	        "color": "#EF9F27",
	        "advice": "prune with caution",
	    },
	    "critical": {
	        "label": "Critical",
	        "color": "#E24B4A",
	        "advice": "do not prune",
	    },
	}


	def summarize(result):
	    """Reduce a scan result (per_layer records + meta) to dashboard aggregates.

	    Returns a dict with the layer/head counts, the number of layers in each
	    regime, the count of eligible layers and of hierarchy violations among
	    them, mean/min/max rho over eligible layers (None when there are none),
	    the headline fragility ``fi_head``, the 0-100 integrity ``score`` and
	    the per-layer ``regimes`` list."""
	    layers = result["per_layer"]
	    eligible = [rec for rec in layers if rec["eligible"]]
	    rhos = [rec["rho"] for rec in eligible if rec["rho"] is not None]
	    fis = [rec["fi"] for rec in layers if rec["fi"] is not None]
	    regimes = [classify_regime(rec) for rec in layers]

	    # Headline fragility: the global (full-graph) base FI when the result
	    # carries one, otherwise the mean of the per-layer values.
	    fi_head = result.get("fi_base")
	    if fi_head is None:
	        fi_head = statistics.mean(fis) if fis else 0.0

	    raw_score = 100.0 - fi_head * SCALING_FACTOR
	    score = max(0.0, min(100.0, raw_score))

	    n_violations = sum(1 for rec in eligible if rec["violation"])
	    return {
	        "n_layers": result["n_layers"],
	        "n_heads": result["n_heads"],
	        "n_immune": regimes.count("immune"),
	        "n_buffer": regimes.count("buffer"),
	        "n_critical": regimes.count("critical"),
	        "n_eligible": len(eligible),
	        "violations": n_violations,
	        "rho_mean": statistics.mean(rhos) if rhos else None,
	        "rho_min": min(rhos) if rhos else None,
	        "rho_max": max(rhos) if rhos else None,
	        "fi_head": fi_head,
	        "score": score,
	        "regimes": regimes,
	    }


	def score_band(score):
	    """Return the (label, color) pair for a structural-integrity gauge value.

	    Bands are checked from the highest floor down; anything below 50 is
	    'Critical'."""
	    bands = (
	        (92, "Over-redundant", "#10B981"),
	        (80, "Healthy", "#10B981"),
	        (50, "Buffer zone", "#EF9F27"),
	    )
	    for floor, label, color in bands:
	        if score >= floor:
	            return label, color
	    return "Critical", "#E24B4A"


	# ========================================================================= #
	# Precomputed reference cache
	# ========================================================================= #
	# Parsed contents of CACHE_PATH; populated on the first _load_cache() call.
	_CACHE = None


	def _load_cache():
	    """Return the parsed reference cache, reading CACHE_PATH on first use.

	    The decoded JSON is kept in the module-level ``_CACHE`` so later calls
	    skip the file read."""
	    global _CACHE
	    if _CACHE is not None:
	        return _CACHE
	    with open(CACHE_PATH, encoding="utf-8") as handle:
	        _CACHE = json.load(handle)
	    return _CACHE


	def reference_rows():
	    """Return the architecture-comparison table rows (I-JEPA, BERT, GPT-2, ViT).

	    The rows come from the cache's "comparison" entry and are handed back
	    as a fresh list."""
	    rows = _load_cache()["comparison"]
	    return list(rows)


	def cached_result(model_id):
	    """Build a scan-shaped result for a pre-loaded model from the cache.

	    Returns None when the model is not in PRELOADED, has no ``cache_key``
	    (e.g. DistilBERT -> needs a live scan), or the cache holds no block
	    under that key. The result is tagged ``"source": "cached"``."""
	    meta = PRELOADED.get(model_id)
	    cache_key = meta.get("cache_key") if meta else None
	    if not cache_key:
	        return None

	    block = _load_cache()["models"].get(cache_key)
	    if block is None:
	        return None

	    result = {
	        "model_id": model_id,
	        "label": meta["label"],
	        "arch": meta["type"],
	    }
	    for field in ("modality", "n_layers", "n_heads", "hidden"):
	        result[field] = block[field]
	    result["params"] = meta["params"]
	    result["per_layer"] = block["per_layer"]
	    result["fi_base"] = block["masking"]["base_fi"]
	    result["source"] = "cached"
	    return result


	# ========================================================================= #
	# Live attention extraction + scan
	# ========================================================================= #
	def _detect_modality(config):
	"""Classify a loaded model as 'vision' \| 'decoder' \| 'encoder'."""
	arch = " ".join(getattr(config, "architectures", None) or []).lower()
	mt = (getattr(config, "model_type", "") or "").lower()
	if "vit" in mt or "vit" in arch or "image" in mt or getattr(config, "image_size", None):
	return "vision"
	if getattr(config, "is_decoder", False) or "gpt" in mt or "llama" in mt \
	or "causal" in arch or "lmhead" in arch:
	return "decoder"
	return "encoder"


	def _arch_label(modality):
	return {"vision": "Vision", "decoder": "Decoder", "encoder": "Encoder"}[modality]


	def _corr(M):
	import numpy as np
	C = np.corrcoef(M)
	return np.nan_to_num(C, nan=0.0)


	def _load_eager_model(model_id, dev):
	    """Load *model_id* in float32 with eager attention, on *dev*, in eval mode."""
	    import torch
	    from transformers import AutoModel
	    model = AutoModel.from_pretrained(
	        model_id, attn_implementation="eager", torch_dtype=torch.float32)
	    model.to(dev).eval()
	    return model


	def _mean_attention(model, model_id, prepared_batches):
	    """Run *model* over the batches and average its attention maps per sample.

	    ``prepared_batches`` yields ``(inputs, n_samples)`` pairs, where
	    ``inputs`` is the keyword mapping passed to the model. Each layer's
	    attentions are summed over the batch axis into a float64 accumulator of
	    shape (n_layers, n_heads, seq_len, seq_len), which is finally divided by
	    the total number of samples.

	    Returns ``(acc, n_layers, n_heads, hidden_size, seq_len)``.
	    Raises RuntimeError if the model returns no attentions or if no batch
	    was supplied."""
	    import numpy as np
	    import torch

	    cfg = model.config
	    n_layers, n_heads = cfg.num_hidden_layers, cfg.num_attention_heads
	    acc = None
	    seq_len = None
	    count = 0
	    for inputs, n_samples in prepared_batches:
	        with torch.no_grad():
	            out = model(**inputs, output_attentions=True)
	        atts = out.attentions
	        if atts is None or atts[0] is None:
	            raise RuntimeError(f"{model_id} returned no attentions")
	        if acc is None:
	            # Size the accumulator from the first batch's attention maps.
	            seq_len = atts[0].shape[-1]
	            acc = np.zeros((n_layers, n_heads, seq_len, seq_len), dtype=np.float64)
	        for layer in range(n_layers):
	            acc[layer] += atts[layer].sum(dim=0).float().cpu().numpy()
	        count += n_samples
	    if acc is None:
	        raise RuntimeError(f"{model_id}: no probe samples were available")
	    acc /= count
	    return acc, n_layers, n_heads, int(cfg.hidden_size), int(seq_len)


	def _extract_text(model_id, dev, max_length=32):
	    """Mean per-head attention maps of a text model over the SENTENCES corpus.

	    Sentences are tokenised four at a time, padded/truncated to
	    ``max_length`` tokens. If the tokenizer has no pad token, its EOS token
	    is used for padding.

	    Returns ``(acc, n_layers, n_heads, hidden_size, seq_len)`` where ``acc``
	    has shape (n_layers, n_heads, seq_len, seq_len).
	    Raises RuntimeError if the model returns no attentions."""
	    from transformers import AutoTokenizer

	    tok = AutoTokenizer.from_pretrained(model_id)
	    if tok.pad_token is None:
	        tok.pad_token = tok.eos_token
	    model = _load_eager_model(model_id, dev)

	    def batches():
	        for start in range(0, len(SENTENCES), 4):
	            chunk = SENTENCES[start:start + 4]
	            encoded = tok(chunk, return_tensors="pt", padding="max_length",
	                          truncation=True, max_length=max_length).to(dev)
	            yield encoded, len(chunk)

	    return _mean_attention(model, model_id, batches())


	def _extract_vision(model_id, dev, num_samples=16):
	    """Mean per-head attention maps of a vision model over probe images.

	    Loads ``num_samples`` probe images via ``_load_images`` and feeds them
	    through the model's image processor four at a time.

	    Returns ``(acc, n_layers, n_heads, hidden_size, seq_len)`` where ``acc``
	    has shape (n_layers, n_heads, seq_len, seq_len).
	    Raises RuntimeError if the model returns no attentions or no probe
	    image is available."""
	    from transformers import AutoImageProcessor

	    proc = AutoImageProcessor.from_pretrained(model_id)
	    model = _load_eager_model(model_id, dev)
	    images = _load_images(num_samples)

	    def batches():
	        for start in range(0, len(images), 4):
	            chunk = images[start:start + 4]
	            yield proc(images=chunk, return_tensors="pt").to(dev), len(chunk)

	    return _mean_attention(model, model_id, batches())


	def _load_images(n):
	    """Return up to n PIL RGB probe images.

	    Tries the first n images of the HF ``uoft-cs/cifar10`` test split. If
	    that yields fewer than four images (including any failure to load the
	    dataset), images are fetched from a fixed list of eight COCO URLs until
	    n images are held or the list is exhausted; individual download
	    failures are skipped.

	    Raises RuntimeError if no image could be obtained; the most recent
	    underlying error, if any, is attached as its cause."""
	    from PIL import Image

	    imgs = []
	    last_error = None
	    try:
	        from datasets import load_dataset
	        ds = load_dataset("uoft-cs/cifar10", split=f"test[:{n}]")
	        col = "img" if "img" in ds.column_names else ds.column_names[0]
	        imgs = [ds[i][col].convert("RGB") for i in range(len(ds))]
	    except Exception as exc:
	        # Best-effort: any dataset failure falls through to the URL fallback.
	        last_error = exc

	    if len(imgs) < 4:
	        import io
	        import urllib.request
	        urls = [
	            "http://images.cocodataset.org/val2017/000000039769.jpg",
	            "http://images.cocodataset.org/val2017/000000000139.jpg",
	            "http://images.cocodataset.org/val2017/000000000285.jpg",
	            "http://images.cocodataset.org/val2017/000000000632.jpg",
	            "http://images.cocodataset.org/val2017/000000000724.jpg",
	            "http://images.cocodataset.org/val2017/000000000776.jpg",
	            "http://images.cocodataset.org/val2017/000000000785.jpg",
	            "http://images.cocodataset.org/val2017/000000000802.jpg",
	        ]
	        # Only the first n images are returned, so stop downloading once
	        # that many are held (at least one, so n <= 0 still probes the net).
	        wanted = max(n, 1)
	        for u in urls:
	            if len(imgs) >= wanted:
	                break
	            try:
	                with urllib.request.urlopen(u, timeout=20) as r:
	                    imgs.append(Image.open(io.BytesIO(r.read())).convert("RGB"))
	            except Exception as exc:
	                # Skip this URL but remember why, for the final error report.
	                last_error = exc

	    if not imgs:
	        raise RuntimeError("could not load any probe images") from last_error
	    return imgs[:n]


	def scan_model(model_id, num_samples=16):
	    """Run a full live structural scan of a HuggingFace transformer.

	    The model's config decides the modality: vision models are probed with
	    ``num_samples`` images, all others with the built-in sentence corpus
	    (``num_samples`` is not used on the text path). For each layer the
	    head-by-head Pearson correlation of the averaged attention maps is
	    thresholded at THRESHOLD and passed through ``hierarchy``; one more
	    hierarchy over all heads of all layers supplies the headline ``fi_base``.

	    Returns a scan-shaped dict (tagged ``"source": "live"``) consumable by
	    ``summarize`` and the UI renderers."""
	    import torch
	    from transformers import AutoConfig

	    dev = "cuda" if torch.cuda.is_available() else "cpu"
	    modality = _detect_modality(AutoConfig.from_pretrained(model_id))

	    if modality == "vision":
	        extracted = _extract_vision(model_id, dev, num_samples)
	    else:
	        extracted = _extract_text(model_id, dev)
	    acc, n_layers, n_heads, hidden, seq_len = extracted

	    def _layer_record(idx):
	        # One row per head: that head's flattened mean attention map.
	        signatures = acc[idx].reshape(n_heads, -1)
	        rec = hierarchy(_corr(signatures), THRESHOLD, edge_cap=400)
	        rec["layer"] = idx
	        return rec

	    per_layer = [_layer_record(idx) for idx in range(n_layers)]

	    # Global graph over every head of every layer, used only for its base FI
	    # (the headline fragility number).
	    all_heads = acc.reshape(n_layers * n_heads, -1)
	    global_rec = hierarchy(_corr(all_heads), THRESHOLD, edge_cap=10 ** 9, giant=True)

	    preset = PRELOADED.get(model_id, {})
	    return {
	        "model_id": model_id,
	        "label": preset.get("label") or model_id.split("/")[-1],
	        "arch": _arch_label(modality),
	        "modality": modality,
	        "n_layers": n_layers,
	        "n_heads": n_heads,
	        "hidden": hidden,
	        "params": preset.get("params"),
	        "per_layer": per_layer,
	        "fi_base": global_rec["fi"],
	        "source": "live",
	    }


	def get_result(model_id, force_rescan=False):
	    """Return a scan result for *model_id*, preferring the precomputed cache.

	    A live scan is run when ``force_rescan`` is true or when the cache has
	    no block for the model (custom models, DistilBERT)."""
	    if force_rescan:
	        return scan_model(model_id)
	    cached = cached_result(model_id)
	    return cached if cached is not None else scan_model(model_id)