Spaces:

cdpearlman
/

LLMVis

Sleeping

cdpearlman committed on Dec 23, 2025

Commit

c19d5a8

1 Parent(s): 4c3d673

Fixed errors for beam search refactor

Files changed (14) hide show

app.py CHANGED Viewed

@@ -827,8 +827,13 @@ def create_layer_accordions(activation_data, activation_data2, original_activati
         tracking_data = compute_layer_wise_summaries(layer_data, activation_data)
         layer_wise_probs = tracking_data.get('layer_wise_top5_probs', {})
         significant_layers = tracking_data.get('significant_layers', [])
         global_top5 = activation_data.get('global_top5_tokens', [])
         # If in ablation mode, also extract original layer data
         original_layer_data = None
         original_layer_wise_probs = {}
@@ -855,6 +860,10 @@ def create_layer_accordions(activation_data, activation_data2, original_activati
             layer_wise_probs2 = tracking_data2.get('layer_wise_top5_probs', {})
             significant_layers2 = tracking_data2.get('significant_layers', [])
             global_top5_2 = activation_data2.get('global_top5_tokens', [])
         # Create accordion panels (reversed to show final layer first)
         accordions = []

         tracking_data = compute_layer_wise_summaries(layer_data, activation_data)
         layer_wise_probs = tracking_data.get('layer_wise_top5_probs', {})
         significant_layers = tracking_data.get('significant_layers', [])
+        # Get global top 5 tokens from activation data
         global_top5 = activation_data.get('global_top5_tokens', [])
+        # Ensure global_top5 is list of dicts (handle legacy tuples/lists from old sessions)
+        if global_top5 and isinstance(global_top5[0], (list, tuple)):
+            global_top5 = [{'token': t, 'probability': p} for t, p in global_top5]
         # If in ablation mode, also extract original layer data
         original_layer_data = None
         original_layer_wise_probs = {}
             layer_wise_probs2 = tracking_data2.get('layer_wise_top5_probs', {})
             significant_layers2 = tracking_data2.get('significant_layers', [])
             global_top5_2 = activation_data2.get('global_top5_tokens', [])
+            # Ensure global_top5_2 is list of dicts (handle legacy tuples)
+            if global_top5_2 and isinstance(global_top5_2[0], (list, tuple)):
+                global_top5_2 = [{'token': t, 'probability': p} for t, p in global_top5_2]
         # Create accordion panels (reversed to show final layer first)
         accordions = []

components/__pycache__/__init__.cpython-311.pyc DELETED Viewed

Binary file (177 Bytes)

components/__pycache__/glossary.cpython-311.pyc DELETED Viewed

Binary file (4.69 kB)

components/__pycache__/main_panel.cpython-311.pyc DELETED Viewed

Binary file (5.08 kB)

components/__pycache__/model_selector.cpython-311.pyc DELETED Viewed

Binary file (2.87 kB)

components/__pycache__/sidebar.cpython-311.pyc DELETED Viewed

Binary file (3.34 kB)

components/__pycache__/tokenization_panel.cpython-311.pyc DELETED Viewed

Binary file (9.78 kB)

utils/__pycache__/__init__.cpython-311.pyc DELETED Viewed

Binary file (1.86 kB)

utils/__pycache__/beam_search.cpython-311.pyc DELETED Viewed

Binary file (7 kB)

utils/__pycache__/head_detection.cpython-311.pyc DELETED Viewed

Binary file (16.1 kB)

utils/__pycache__/model_config.cpython-311.pyc DELETED Viewed

Binary file (8.45 kB)

utils/__pycache__/model_patterns.cpython-311.pyc DELETED Viewed

Binary file (59.4 kB)

utils/__pycache__/prompt_comparison.cpython-311.pyc DELETED Viewed

Binary file (13.9 kB)

utils/model_patterns.py CHANGED Viewed

@@ -92,7 +92,7 @@ def merge_token_probabilities(token_probs: List[Tuple[str, float]]) -> List[Tupl
     return result
-def compute_global_top5_tokens(model_output, tokenizer, top_k: int = 5) -> List[Tuple[str, float]]:
     """
     Compute the global top-5 tokens from model's final output with merged probabilities.
@@ -102,7 +102,7 @@ def compute_global_top5_tokens(model_output, tokenizer, top_k: int = 5) -> List[
         top_k: Number of top tokens to return (default: 5)
     Returns:
-        List of (token_string, probability) tuples for top K tokens with merged probabilities
     """
     with torch.no_grad():
         # Get probabilities for next token (last position)
@@ -121,8 +121,8 @@ def compute_global_top5_tokens(model_output, tokenizer, top_k: int = 5) -> List[
         # Merge tokens with/without leading space
         merged = merge_token_probabilities(candidates)
-        # Return top K after merging
-        return merged[:top_k]
 def get_actual_model_output(model_output, tokenizer) -> Tuple[str, float]:
@@ -1048,7 +1048,12 @@ def extract_layer_data(activation_data: Dict[str, Any], model, tokenizer) -> Lis
     # Get global top 5 tokens from final output
     global_top5_tokens = activation_data.get('global_top5_tokens', [])
-    global_top5_token_names = [token for token, _ in global_top5_tokens]
     layer_data = []
     prev_token_probs = {}  # Track previous layer's token probabilities (layer's own top 5)

     return result
+def compute_global_top5_tokens(model_output, tokenizer, top_k: int = 5) -> List[Dict[str, Any]]:
     """
     Compute the global top-5 tokens from model's final output with merged probabilities.
         top_k: Number of top tokens to return (default: 5)
     Returns:
+        List of dicts {'token': str, 'probability': float} for top K tokens
     """
     with torch.no_grad():
         # Get probabilities for next token (last position)
         # Merge tokens with/without leading space
         merged = merge_token_probabilities(candidates)
+        # Return top K after merging, formatted as dicts
+        return [{'token': t, 'probability': p} for t, p in merged[:top_k]]
 def get_actual_model_output(model_output, tokenizer) -> Tuple[str, float]:
     # Get global top 5 tokens from final output
     global_top5_tokens = activation_data.get('global_top5_tokens', [])
+    # Handle both dicts (new format) and tuples (legacy)
+    if global_top5_tokens and isinstance(global_top5_tokens[0], dict):
+        global_top5_token_names = [t.get('token') for t in global_top5_tokens]
+    else:
+        global_top5_token_names = [token for token, _ in global_top5_tokens]
     layer_data = []
     prev_token_probs = {}  # Track previous layer's token probabilities (layer's own top 5)