diff --git a/.gitignore b/.gitignore
index 2017073d7b72ec8afc14c30950ba209b829c4f1c..79796946618c59d07a83cdd1e7072f33a6f371bb 100644
--- a/.gitignore
+++ b/.gitignore
@@ -19,7 +19,8 @@ node_modules/
 *.env
 *.cache
 
-app/scripts/latex-converter/input-example/
+app/scripts/latex-converter/input/
+app/scripts/latex-converter/output/
 
 # PDF export
 app/public/*.pdf
diff --git a/app/.astro/astro/content.d.ts b/app/.astro/astro/content.d.ts
index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..bba937b3dafa7018a200be372604d19a76078a60 100644
--- a/app/.astro/astro/content.d.ts
+++ b/app/.astro/astro/content.d.ts
@@ -0,0 +1,247 @@
+declare module 'astro:content' {
+	interface Render {
+		'.mdx': Promise<{
+			Content: import('astro').MarkdownInstance<{}>['Content'];
+			headings: import('astro').MarkdownHeading[];
+			remarkPluginFrontmatter: Record<string, any>;
+			components: import('astro').MDXInstance<{}>['components'];
+		}>;
+	}
+}
+
+declare module 'astro:content' {
+	interface RenderResult {
+		Content: import('astro/runtime/server/index.js').AstroComponentFactory;
+		headings: import('astro').MarkdownHeading[];
+		remarkPluginFrontmatter: Record<string, any>;
+	}
+	interface Render {
+		'.md': Promise<RenderResult>;
+	}
+
+	export interface RenderedContent {
+		html: string;
+		metadata?: {
+			imagePaths: Array<string>;
+			[key: string]: unknown;
+		};
+	}
+}
+
+declare module 'astro:content' {
+	type Flatten<T> = T extends { [K: string]: infer U } ? U : never;
+
+	export type CollectionKey = keyof AnyEntryMap;
+	export type CollectionEntry<C extends CollectionKey> = Flatten<AnyEntryMap[C]>;
+
+	export type ContentCollectionKey = keyof ContentEntryMap;
+	export type DataCollectionKey = keyof DataEntryMap;
+
+	type AllValuesOf<T> = T extends any ? T[keyof T] : never;
+	type ValidContentEntrySlug<C extends keyof ContentEntryMap> = AllValuesOf<
+		ContentEntryMap[C]
+	>['slug'];
+
+	/** @deprecated Use `getEntry` instead. */
+	export function getEntryBySlug<
+		C extends keyof ContentEntryMap,
+		E extends ValidContentEntrySlug<C> | (string & {}),
+	>(
+		collection: C,
+		// Note that this has to accept a regular string too, for SSR
+		entrySlug: E,
+	): E extends ValidContentEntrySlug<C>
+		? Promise<CollectionEntry<C>>
+		: Promise<CollectionEntry<C> | undefined>;
+
+	/** @deprecated Use `getEntry` instead. */
+	export function getDataEntryById<C extends keyof DataEntryMap, E extends keyof DataEntryMap[C]>(
+		collection: C,
+		entryId: E,
+	): Promise<CollectionEntry<C>>;
+
+	export function getCollection<C extends keyof AnyEntryMap, E extends CollectionEntry<C>>(
+		collection: C,
+		filter?: (entry: CollectionEntry<C>) => entry is E,
+	): Promise<E[]>;
+	export function getCollection<C extends keyof AnyEntryMap>(
+		collection: C,
+		filter?: (entry: CollectionEntry<C>) => unknown,
+	): Promise<CollectionEntry<C>[]>;
+
+	export function getEntry<
+		C extends keyof ContentEntryMap,
+		E extends ValidContentEntrySlug<C> | (string & {}),
+	>(entry: {
+		collection: C;
+		slug: E;
+	}): E extends ValidContentEntrySlug<C>
+		? Promise<CollectionEntry<C>>
+		: Promise<CollectionEntry<C> | undefined>;
+	export function getEntry<
+		C extends keyof DataEntryMap,
+		E extends keyof DataEntryMap[C] | (string & {}),
+	>(entry: {
+		collection: C;
+		id: E;
+	}): E extends keyof DataEntryMap[C]
+		? Promise<DataEntryMap[C][E]>
+		: Promise<CollectionEntry<C> | undefined>;
+	export function getEntry<
+		C extends keyof ContentEntryMap,
+		E extends ValidContentEntrySlug<C> | (string & {}),
+	>(
+		collection: C,
+		slug: E,
+	): E extends ValidContentEntrySlug<C>
+		? Promise<CollectionEntry<C>>
+		: Promise<CollectionEntry<C> | undefined>;
+	export function getEntry<
+		C extends keyof DataEntryMap,
+		E extends keyof DataEntryMap[C] | (string & {}),
+	>(
+		collection: C,
+		id: E,
+	): E extends keyof DataEntryMap[C]
+		? Promise<DataEntryMap[C][E]>
+		: Promise<CollectionEntry<C> | undefined>;
+
+	/** Resolve an array of entry references from the same collection */
+	export function getEntries<C extends keyof ContentEntryMap>(
+		entries: {
+			collection: C;
+			slug: ValidContentEntrySlug<C>;
+		}[],
+	): Promise<CollectionEntry<C>[]>;
+	export function getEntries<C extends keyof DataEntryMap>(
+		entries: {
+			collection: C;
+			id: keyof DataEntryMap[C];
+		}[],
+	): Promise<CollectionEntry<C>[]>;
+
+	export function render<C extends keyof AnyEntryMap>(
+		entry: AnyEntryMap[C][string],
+	): Promise<RenderResult>;
+
+	export function reference<C extends keyof AnyEntryMap>(
+		collection: C,
+	): import('astro/zod').ZodEffects<
+		import('astro/zod').ZodString,
+		C extends keyof ContentEntryMap
+			? {
+					collection: C;
+					slug: ValidContentEntrySlug<C>;
+				}
+			: {
+					collection: C;
+					id: keyof DataEntryMap[C];
+				}
+	>;
+	// Allow generic `string` to avoid excessive type errors in the config
+	// if `dev` is not running to update as you edit.
+	// Invalid collection names will be caught at build time.
+	export function reference<C extends string>(
+		collection: C,
+	): import('astro/zod').ZodEffects<import('astro/zod').ZodString, never>;
+
+	type ReturnTypeOrOriginal<T> = T extends (...args: any[]) => infer R ? R : T;
+	type InferEntrySchema<C extends keyof AnyEntryMap> = import('astro/zod').infer<
+		ReturnTypeOrOriginal<Required<ContentConfig['collections'][C]>['schema']>
+	>;
+
+	type ContentEntryMap = {
+		"chapters": {
+"00_abstract.mdx": {
+	id: "00_abstract.mdx";
+  slug: "00_abstract";
+  body: string;
+  collection: "chapters";
+  data: any
+} & { render(): Render[".mdx"] };
+"01_introduction.mdx": {
+	id: "01_introduction.mdx";
+  slug: "01_introduction";
+  body: string;
+  collection: "chapters";
+  data: any
+} & { render(): Render[".mdx"] };
+"02_classic_robotics.mdx": {
+	id: "02_classic_robotics.mdx";
+  slug: "02_classic_robotics";
+  body: string;
+  collection: "chapters";
+  data: any
+} & { render(): Render[".mdx"] };
+"03_reinforcement_learning.mdx": {
+	id: "03_reinforcement_learning.mdx";
+  slug: "03_reinforcement_learning";
+  body: string;
+  collection: "chapters";
+  data: any
+} & { render(): Render[".mdx"] };
+"04_imitation_learning.mdx": {
+	id: "04_imitation_learning.mdx";
+  slug: "04_imitation_learning";
+  body: string;
+  collection: "chapters";
+  data: any
+} & { render(): Render[".mdx"] };
+"06_next_directions.mdx": {
+	id: "06_next_directions.mdx";
+  slug: "06_next_directions";
+  body: string;
+  collection: "chapters";
+  data: any
+} & { render(): Render[".mdx"] };
+"07_conclusions.mdx": {
+	id: "07_conclusions.mdx";
+  slug: "07_conclusions";
+  body: string;
+  collection: "chapters";
+  data: any
+} & { render(): Render[".mdx"] };
+"A_foreword.mdx": {
+	id: "A_foreword.mdx";
+  slug: "a_foreword";
+  body: string;
+  collection: "chapters";
+  data: any
+} & { render(): Render[".mdx"] };
+};
+"embeds": {
+"vibe-code-d3-embeds-directives.md": {
+	id: "vibe-code-d3-embeds-directives.md";
+  slug: "vibe-code-d3-embeds-directives";
+  body: string;
+  collection: "embeds";
+  data: any
+} & { render(): Render[".md"] };
+};
+"test": {
+"converted-sample.mdx": {
+	id: "converted-sample.mdx";
+  slug: "converted-sample";
+  body: string;
+  collection: "test";
+  data: any
+} & { render(): Render[".mdx"] };
+};
+
+	};
+
+	type DataEntryMap = {
+		"assets": {
+"data/somedata": {
+	id: "data/somedata";
+  collection: "assets";
+  data: any
+};
+};
+
+	};
+
+	type AnyEntryMap = ContentEntryMap & DataEntryMap;
+
+	export type ContentConfig = never;
+}
diff --git a/app/scripts/latex-to-markdown/README.md b/app/scripts/latex-to-markdown/README.md
deleted file mode 100644
index 2e068e91f0ae92820087720c29a73dc5e0b315f5..0000000000000000000000000000000000000000
--- a/app/scripts/latex-to-markdown/README.md
+++ /dev/null
@@ -1,158 +0,0 @@
-# LaTeX to Markdown Toolkit
-
-Conversion modulaire de projets LaTeX vers Markdown avec Pandoc.
-
-## 🚀 Usage rapide
-
-```bash
-# Conversion complète (LaTeX + bibliographie)
-node index.mjs --clean
-
-# Seulement nettoyer la bibliographie
-node index.mjs --bib-only
-
-# Seulement convertir LaTeX (utilise une .bib existante)
-node index.mjs --convert-only
-```
-
-## 📁 Structure
-
-```
-latex-to-markdown/
-├── index.mjs              # Script principal
-├── latex-converter.mjs    # Convertisseur LaTeX → Markdown
-├── bib-cleaner.mjs       # Nettoyeur de bibliographie
-├── input/                # Dossier source LaTeX
-│   ├── main.tex
-│   ├── main.bib
-│   └── sections/
-└── output/               # Résultats de conversion
-    ├── main.md
-    └── main.bib
-```
-
-## 🔧 Modules
-
-### `index.mjs` - Script principal
-Point d'entrée unifié avec options complètes.
-
-**Options :**
-- `--input=PATH` : Fichier LaTeX source
-- `--output=PATH` : Dossier de sortie  
-- `--clean` : Nettoyer le dossier de sortie
-- `--bib-only` : Seulement nettoyer la bibliographie
-- `--convert-only` : Seulement convertir (skip bibliographie)
-
-### `latex-converter.mjs` - Convertisseur
-Conversion LaTeX vers Markdown avec Pandoc.
-
-**Fonctionnalités :**
-- Support natif des macros LaTeX (`+latex_macros`)
-- Gestion automatique des `\input{}`
-- Citations avec `--citeproc`
-- Extraction des images avec `--extract-media`
-- Support mathématique avec `--mathjax`
-
-### `bib-cleaner.mjs` - Nettoyeur de bibliographie
-Supprime les références externes des fichiers `.bib`.
-
-**Nettoyage :**
-- Supprime les `file = {...}` (chemins locaux)
-- Nettoie les virgules doubles
-- Élimine les lignes vides
-
-## 📊 Exemple de workflow
-
-```bash
-# 1. Placer vos fichiers LaTeX dans input/
-cp mon-projet/* input/
-
-# 2. Conversion complète
-node index.mjs --clean
-
-# 3. Récupérer les résultats dans output/
-ls output/
-# → main.md (Markdown converti)
-# → main.bib (Bibliographie nettoyée)
-```
-
-## ⚙️ Configuration avancée
-
-### Chemins personnalisés
-```bash
-node index.mjs \
-  --input=../paper/main.tex \
-  --output=../results/ \
-  --clean
-```
-
-### Usage programmatique
-```javascript
-import { convertLatexToMarkdown, cleanBibliography } from './index.mjs';
-
-// Conversion LaTeX
-await convertLatexToMarkdown('input.tex', 'output/');
-
-// Nettoyage bibliographie
-await cleanBibliography('refs.bib', 'clean-refs.bib');
-```
-
-## 🛠️ Prérequis
-
-- **Node.js** avec support ESM
-- **Pandoc** (`brew install pandoc`)
-
-## 🎯 Pandoc natif
-
-Le toolkit maximise l'utilisation de Pandoc natif :
-
-- **`+latex_macros`** : Gère `\newcommand`, `\renewcommand`
-- **`--citeproc`** : Traitement automatique des citations
-- **`--bibliography`** : Support de `.bib` files
-- **`--extract-media`** : Images automatiques
-- **`--mathjax`** : Mathématiques avancées
-
-Résultat : **95% Pandoc natif, 5% preprocessing minimal** ! 🚀
-
----
-
-## 📝 État Actuel du Projet
-
-### ✅ Complété
-- **Architecture modulaire** : `index.mjs` + `latex-converter.mjs` + `bib-cleaner.mjs`
-- **Preprocessing LaTeX** : Gestion des `\input{}` pour assembler le document complet
-- **Nettoyage bibliographie** : Suppression des références externes (`file = {...}`)
-- **Conversion Pandoc** : Format `gfm+tex_math_dollars` pour compatibilité Astro
-- **Citations sans crochets** : Format `@citationkey` au lieu de `[@citationkey]`
-- **Gestion des commandes personnalisées** : `\actionchunk`, `\textsc`, `\gets`, etc.
-- **Extraction d'images** : Support automatique via `--extract-media`
-
-### 🔧 En Cours de Résolution
-- **Erreurs Pandoc sur certaines sections** : 
-  - Section `03_reinforcement_learning.tex` contient des constructions LaTeX problématiques
-  - Erreur à la ligne 2011 : `unexpected }` dans le contexte de citations complexes
-  - Commande `\textsc{PopFront(\( \actionchunk_t \))}` mal interprétée
-
-### 🎯 Prochaines Étapes
-1. **Déboguer section 03** : Identifier et corriger les constructions LaTeX incompatibles
-2. **Test sections individuelles** : Valider chaque section séparément
-3. **Améliorer preprocessing** : Ajouter plus de transformations pour gérer les cas complexes
-4. **Validation finale** : Conversion complète du document
-
-### 🚨 Problèmes Identifiés
-- **Commandes imbriquées** : `\textsc{...(\( math \))}` pose problème à Pandoc
-- **Citations complexes** : Certains patterns de citations avec math inline
-- **Math environments** : Quelques environnements non reconnus correctement
-
-### 🔍 Diagnostic
-Dernière erreur :
-```
-Error at "temp_main.tex" (line 2011, column 234):
-unexpected }
-expecting \end{document}
-~@zhaoLearningFineGrainedBimanual2023 adopts a different strategy whereby...
-\( \actionchunk_t \gets \pi(o_t) \) and chunk consumption 
-\( a_t \gets \textsc{PopFront(\( \actionchunk_t \))} \)
-```
-
-Le problème semble être dans l'imbrication de `\textsc{}` avec des expressions mathématiques à l'intérieur.
diff --git a/app/scripts/latex-to-markdown/test-figure.tex b/app/scripts/latex-to-markdown/test-figure.tex
deleted file mode 100644
index 13a118ef63bd5fd09f1e9a4ffbe28c981d85b266..0000000000000000000000000000000000000000
--- a/app/scripts/latex-to-markdown/test-figure.tex
+++ /dev/null
@@ -1,6 +0,0 @@
-\begin{figure}
-\centering  
-\includegraphics{test.png}
-\caption{Test figure}
-\label{fig:test}
-\end{figure}
diff --git a/app/scripts/latex-to-mdx/README.md b/app/scripts/latex-to-mdx/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..6eb428dba27e92ce07d8d24955a9f7d522d94e8d
--- /dev/null
+++ b/app/scripts/latex-to-mdx/README.md
@@ -0,0 +1,169 @@
+# LaTeX to MDX Toolkit
+
+Complete LaTeX to MDX (Markdown + JSX) conversion optimized for Astro with advanced support for references, interactive equations, and components.
+
+## 🚀 Quick Start
+
+```bash
+# Complete LaTeX → MDX conversion with all features
+node index.mjs
+
+# For step-by-step debugging
+node latex-converter.mjs    # LaTeX → Markdown
+node mdx-converter.mjs      # Markdown → MDX
+```
+
+## 📁 Structure
+
+```
+latex-to-mdx/
+├── index.mjs                    # Complete LaTeX → MDX pipeline
+├── latex-converter.mjs          # LaTeX → Markdown with Pandoc
+├── mdx-converter.mjs           # Markdown → MDX with Astro components
+├── reference-preprocessor.mjs  # LaTeX references cleanup
+├── post-processor.mjs          # Markdown post-processing
+├── bib-cleaner.mjs            # Bibliography cleaner
+├── filters/
+│   └── equation-ids.lua        # Pandoc filter for KaTeX equations
+├── input/                      # LaTeX sources
+│   ├── main.tex
+│   ├── main.bib
+│   └── sections/
+└── output/                     # Results
+    ├── main.md                 # Intermediate Markdown
+    └── main.mdx               # Final MDX for Astro
+```
+
+## ✨ Key Features
+
+### 🎯 **Smart References**
+- **Invisible anchors**: Automatic conversion of `\label{}` to `<span id="..." style="position: absolute;"></span>`
+- **Clean links**: Identifier cleanup (`:` → `-`, removing prefixes `sec:`, `fig:`, `eq:`)
+- **Cross-references**: Full support for `\ref{}` with functional links
+
+### 🧮 **Interactive Equations**
+- **KaTeX IDs**: Conversion of `\label{eq:...}` to `\htmlId{id}{equation}` 
+- **Equation references**: Clickable links to mathematical equations
+- **Advanced KaTeX support**: `trust: true` configuration for `\htmlId{}`
+
+### 🎨 **Automatic Styling**  
+- **Highlights**: `\highlight{text}` → `<span class="highlight">text</span>`
+- **Auto cleanup**: Removal of numbering `(1)`, `(2)`, etc.
+- **Astro components**: Images → `ResponsiveImage` with automatic imports
+
+### 🔧 **Robust Pipeline**
+- **LaTeX preprocessor**: Reference cleanup before Pandoc
+- **Lua filter**: Equation processing in Pandoc AST  
+- **Post-processor**: Markdown cleanup and optimization
+- **MDX converter**: Final transformation with Astro components
+
+## 📊 Example Workflow
+
+```bash
+# 1. Prepare LaTeX sources
+cp my-paper/* input/
+
+# 2. Complete automatic conversion
+node index.mjs
+
+# 3. Generated results
+ls output/
+# → main.md (Intermediate Markdown)  
+# → main.mdx (Final MDX for Astro)
+# → assets/image/ (extracted images)
+```
+
+### 📋 Conversion Result
+
+The pipeline generates an MDX file optimized for Astro with:
+
+```mdx
+---
+title: "Your Article Title"
+description: "Generated from LaTeX"
+---
+
+import ResponsiveImage from '../components/ResponsiveImage.astro';
+import figure1 from '../assets/image/figure1.png';
+
+## Section with invisible anchor
+<span id="introduction" style="position: absolute;"></span>
+
+Here is some text with <span class="highlight">highlighted words</span>.
+
+Reference to an interactive [equation](#equation-name).
+
+Equation with KaTeX ID:
+$$\htmlId{equation-name}{E = mc^2}$$
+
+<ResponsiveImage src={figure1} alt="Description" />
+```
+
+## ⚙️ Required Astro Configuration
+
+To use equations with IDs, add to `astro.config.mjs`:
+
+```javascript
+import rehypeKatex from 'rehype-katex';
+
+export default defineConfig({
+  markdown: {
+    rehypePlugins: [
+      [rehypeKatex, { trust: true }], // ← Important for \htmlId{}
+    ],
+  },
+});
+```
+
+## 🛠️ Prerequisites
+
+- **Node.js** with ESM support
+- **Pandoc** (`brew install pandoc`)
+- **Astro** to use the generated MDX
+
+## 🎯 Technical Architecture
+
+### 4-Stage Pipeline
+
+1. **LaTeX Preprocessing** (`reference-preprocessor.mjs`)
+   - Cleanup of `\label{}` and `\ref{}`
+   - Conversion `\highlight{}` → CSS spans
+   - Removal of prefixes and problematic characters
+
+2. **Pandoc + Lua Filter** (`equation-ids.lua`)
+   - LaTeX → Markdown conversion with `gfm+tex_math_dollars+raw_html`
+   - Equation processing: `\label{eq:name}` → `\htmlId{name}{equation}`
+   - Automatic image extraction
+
+3. **Markdown Post-processing** (`post-processor.mjs`)
+   - KaTeX, Unicode, grouping commands cleanup
+   - Attribute correction with `:` 
+   - Code snippet injection
+
+4. **MDX Conversion** (`mdx-converter.mjs`)
+   - Images transformation → `ResponsiveImage`
+   - HTML span escaping correction
+   - Automatic imports generation
+   - MDX frontmatter
+
+## 📊 Conversion Statistics
+
+For a typical scientific document:
+- **87 labels** detected and processed
+- **48 invisible anchors** created  
+- **13 highlight spans** with CSS class
+- **4 equations** with `\htmlId{}` KaTeX
+- **40 images** converted to components
+
+## ✅ Project Status
+
+### 🎉 **Complete Features**
+- ✅ **LaTeX → MDX Pipeline**: Full end-to-end functional conversion
+- ✅ **Cross-document references**: Perfectly functional internal links  
+- ✅ **Interactive equations**: KaTeX support with clickable IDs
+- ✅ **Automatic styling**: Highlights and Astro components
+- ✅ **Robustness**: Automatic cleanup of all escaping
+- ✅ **Optimization**: Clean code without unnecessary elements
+
+### 🚀 **Production Ready**
+The toolkit is now **100% operational** for converting complex scientific LaTeX documents to MDX/Astro with all advanced features (references, interactive equations, styling).
diff --git a/app/scripts/latex-to-markdown/bib-cleaner.mjs b/app/scripts/latex-to-mdx/bib-cleaner.mjs
similarity index 100%
rename from app/scripts/latex-to-markdown/bib-cleaner.mjs
rename to app/scripts/latex-to-mdx/bib-cleaner.mjs
diff --git a/app/scripts/latex-to-markdown/filters/equation-ids.lua b/app/scripts/latex-to-mdx/filters/equation-ids.lua
similarity index 74%
rename from app/scripts/latex-to-markdown/filters/equation-ids.lua
rename to app/scripts/latex-to-mdx/filters/equation-ids.lua
index 4e97706ba9f915a2b1b6094c8bcfab44530222f4..86c980f35db55a4869708694930218c7fb32d219 100644
--- a/app/scripts/latex-to-markdown/filters/equation-ids.lua
+++ b/app/scripts/latex-to-mdx/filters/equation-ids.lua
@@ -48,17 +48,34 @@ function Math(el)
         -- Clean up any extra whitespace or line breaks that might remain
         clean_math = clean_math:gsub("%s*$", ""):gsub("^%s*", "")
         
-        -- Remove problematic equation environments that don't work well with \htmlId
-        clean_math = clean_math:gsub("\\begin%{equation%}", ""):gsub("\\end%{equation%}", "")
-        clean_math = clean_math:gsub("\\begin%{align%}", ""):gsub("\\end%{align%}", "")
-        clean_math = clean_math:gsub("\\begin%{equation%*%}", ""):gsub("\\end%{equation%*%}", "")
-        clean_math = clean_math:gsub("\\begin%{align%*%}", ""):gsub("\\end%{align%*%}", "")
+        -- Handle different equation environments appropriately
+        -- For align environments, preserve them as they work with KaTeX
+        local has_align = clean_math:match("\\begin%{align%}")
+        
+        if has_align then
+            -- For align environments, we keep the structure and add ID as an attribute
+            -- KaTeX supports align environments natively
+            clean_math = clean_math:gsub("\\begin%{align%}", "\\begin{align}")
+            clean_math = clean_math:gsub("\\end%{align%}", "\\end{align}")
+        else
+            -- Remove other equation environments that don't work well with \htmlId
+            clean_math = clean_math:gsub("\\begin%{equation%}", ""):gsub("\\end%{equation%}", "")
+            clean_math = clean_math:gsub("\\begin%{equation%*%}", ""):gsub("\\end%{equation%*%}", "")
+            clean_math = clean_math:gsub("\\begin%{align%*%}", ""):gsub("\\end%{align%*%}", "")
+        end
         
         -- Clean up any remaining whitespace
         clean_math = clean_math:gsub("%s*$", ""):gsub("^%s*", "")
         
-        -- Wrap the equation content with \htmlId{}
-        local new_math = "\\htmlId{" .. clean_id .. "}{" .. clean_math .. "}"
+        local new_math
+        if has_align then
+            -- For align environments, add the ID differently - KaTeX doesn't support \htmlId with align
+            -- Instead, we'll add a span with the ID right before the align
+            new_math = clean_math
+        else
+            -- For other math, wrap with \htmlId{}
+            new_math = "\\htmlId{" .. clean_id .. "}{" .. clean_math .. "}"
+        end
         
         -- Return new Math element with the updated content
         return pandoc.Math(el.mathtype, new_math)
diff --git a/app/scripts/latex-to-markdown/index.mjs b/app/scripts/latex-to-mdx/index.mjs
similarity index 100%
rename from app/scripts/latex-to-markdown/index.mjs
rename to app/scripts/latex-to-mdx/index.mjs
diff --git a/app/scripts/latex-to-markdown/input/.gitignore b/app/scripts/latex-to-mdx/input/.gitignore
similarity index 100%
rename from app/scripts/latex-to-markdown/input/.gitignore
rename to app/scripts/latex-to-mdx/input/.gitignore
diff --git a/app/scripts/latex-to-markdown/input/README.md b/app/scripts/latex-to-mdx/input/README.md
similarity index 100%
rename from app/scripts/latex-to-markdown/input/README.md
rename to app/scripts/latex-to-mdx/input/README.md
diff --git a/app/scripts/latex-to-markdown/input/_minted/62B8750C0ACEBDA39A95140434E540A8.highlight.minted b/app/scripts/latex-to-mdx/input/_minted/62B8750C0ACEBDA39A95140434E540A8.highlight.minted
similarity index 100%
rename from app/scripts/latex-to-markdown/input/_minted/62B8750C0ACEBDA39A95140434E540A8.highlight.minted
rename to app/scripts/latex-to-mdx/input/_minted/62B8750C0ACEBDA39A95140434E540A8.highlight.minted
diff --git a/app/scripts/latex-to-markdown/input/_minted/_FAD58DE7366495DB4650CFEFAC2FCD61.index.minted b/app/scripts/latex-to-mdx/input/_minted/_FAD58DE7366495DB4650CFEFAC2FCD61.index.minted
similarity index 100%
rename from app/scripts/latex-to-markdown/input/_minted/_FAD58DE7366495DB4650CFEFAC2FCD61.index.minted
rename to app/scripts/latex-to-mdx/input/_minted/_FAD58DE7366495DB4650CFEFAC2FCD61.index.minted
diff --git a/app/scripts/latex-to-markdown/input/_minted/colorful.style.minted b/app/scripts/latex-to-mdx/input/_minted/colorful.style.minted
similarity index 100%
rename from app/scripts/latex-to-markdown/input/_minted/colorful.style.minted
rename to app/scripts/latex-to-mdx/input/_minted/colorful.style.minted
diff --git a/app/scripts/latex-to-markdown/input/fancyhdr.sty b/app/scripts/latex-to-mdx/input/fancyhdr.sty
similarity index 100%
rename from app/scripts/latex-to-markdown/input/fancyhdr.sty
rename to app/scripts/latex-to-mdx/input/fancyhdr.sty
diff --git a/app/scripts/latex-to-markdown/input/figures/ch1/ch1-lerobot-figure1.png b/app/scripts/latex-to-mdx/input/figures/ch1/ch1-lerobot-figure1.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch1/ch1-lerobot-figure1.png
rename to app/scripts/latex-to-mdx/input/figures/ch1/ch1-lerobot-figure1.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch2/ch2-approaches.png b/app/scripts/latex-to-mdx/input/figures/ch2/ch2-approaches.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch2/ch2-approaches.png
rename to app/scripts/latex-to-mdx/input/figures/ch2/ch2-approaches.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch2/ch2-classical-limitations.png b/app/scripts/latex-to-mdx/input/figures/ch2/ch2-classical-limitations.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch2/ch2-classical-limitations.png
rename to app/scripts/latex-to-mdx/input/figures/ch2/ch2-classical-limitations.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch2/ch2-cost-accessibility.png b/app/scripts/latex-to-mdx/input/figures/ch2/ch2-cost-accessibility.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch2/ch2-cost-accessibility.png
rename to app/scripts/latex-to-mdx/input/figures/ch2/ch2-cost-accessibility.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch2/ch2-planar-manipulator-floor-box.png b/app/scripts/latex-to-mdx/input/figures/ch2/ch2-planar-manipulator-floor-box.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch2/ch2-planar-manipulator-floor-box.png
rename to app/scripts/latex-to-mdx/input/figures/ch2/ch2-planar-manipulator-floor-box.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch2/ch2-planar-manipulator-floor-shelf.png b/app/scripts/latex-to-mdx/input/figures/ch2/ch2-planar-manipulator-floor-shelf.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch2/ch2-planar-manipulator-floor-shelf.png
rename to app/scripts/latex-to-mdx/input/figures/ch2/ch2-planar-manipulator-floor-shelf.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch2/ch2-planar-manipulator-floor.png b/app/scripts/latex-to-mdx/input/figures/ch2/ch2-planar-manipulator-floor.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch2/ch2-planar-manipulator-floor.png
rename to app/scripts/latex-to-mdx/input/figures/ch2/ch2-planar-manipulator-floor.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch2/ch2-planar-manipulator-free.png b/app/scripts/latex-to-mdx/input/figures/ch2/ch2-planar-manipulator-free.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch2/ch2-planar-manipulator-free.png
rename to app/scripts/latex-to-mdx/input/figures/ch2/ch2-planar-manipulator-free.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch2/ch2-platforms.png b/app/scripts/latex-to-mdx/input/figures/ch2/ch2-platforms.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch2/ch2-platforms.png
rename to app/scripts/latex-to-mdx/input/figures/ch2/ch2-platforms.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch2/ch2-so100-to-planar-manipulator.png b/app/scripts/latex-to-mdx/input/figures/ch2/ch2-so100-to-planar-manipulator.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch2/ch2-so100-to-planar-manipulator.png
rename to app/scripts/latex-to-mdx/input/figures/ch2/ch2-so100-to-planar-manipulator.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch3/ch3-agent-env.png b/app/scripts/latex-to-mdx/input/figures/ch3/ch3-agent-env.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch3/ch3-agent-env.png
rename to app/scripts/latex-to-mdx/input/figures/ch3/ch3-agent-env.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch3/ch3-duck-sim-vs-real.png b/app/scripts/latex-to-mdx/input/figures/ch3/ch3-duck-sim-vs-real.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch3/ch3-duck-sim-vs-real.png
rename to app/scripts/latex-to-mdx/input/figures/ch3/ch3-duck-sim-vs-real.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch3/ch3-hil-serl-examples.png b/app/scripts/latex-to-mdx/input/figures/ch3/ch3-hil-serl-examples.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch3/ch3-hil-serl-examples.png
rename to app/scripts/latex-to-mdx/input/figures/ch3/ch3-hil-serl-examples.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch3/ch3-learning-atlas.png b/app/scripts/latex-to-mdx/input/figures/ch3/ch3-learning-atlas.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch3/ch3-learning-atlas.png
rename to app/scripts/latex-to-mdx/input/figures/ch3/ch3-learning-atlas.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch3/ch3-learning-benefits.png b/app/scripts/latex-to-mdx/input/figures/ch3/ch3-learning-benefits.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch3/ch3-learning-benefits.png
rename to app/scripts/latex-to-mdx/input/figures/ch3/ch3-learning-benefits.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch3/ch3-many-ducks.png b/app/scripts/latex-to-mdx/input/figures/ch3/ch3-many-ducks.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch3/ch3-many-ducks.png
rename to app/scripts/latex-to-mdx/input/figures/ch3/ch3-many-ducks.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch3/ch3-rl-algorithms-atlas.png b/app/scripts/latex-to-mdx/input/figures/ch3/ch3-rl-algorithms-atlas.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch3/ch3-rl-algorithms-atlas.png
rename to app/scripts/latex-to-mdx/input/figures/ch3/ch3-rl-algorithms-atlas.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch3/ch3-rl-examples.png b/app/scripts/latex-to-mdx/input/figures/ch3/ch3-rl-examples.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch3/ch3-rl-examples.png
rename to app/scripts/latex-to-mdx/input/figures/ch3/ch3-rl-examples.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-act-decoder.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-act-decoder.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-act-decoder.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-act-decoder.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-act-encoder.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-act-encoder.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-act-encoder.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-act-encoder.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-act.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-act.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-act.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-act.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-action-vs-observation-distribution.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-action-vs-observation-distribution.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-action-vs-observation-distribution.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-action-vs-observation-distribution.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-async-inference.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-async-inference.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-async-inference.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-async-inference.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-bc-trajectories.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-bc-trajectories.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-bc-trajectories.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-bc-trajectories.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-diffusion-policy.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-diffusion-policy.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-diffusion-policy.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-diffusion-policy.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-diffusion-robot-actions.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-diffusion-robot-actions.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-diffusion-robot-actions.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-diffusion-robot-actions.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-diffusion-vs-flowmatching.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-diffusion-vs-flowmatching.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-diffusion-vs-flowmatching.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-diffusion-vs-flowmatching.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-issues-with-bc.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-issues-with-bc.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-issues-with-bc.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-issues-with-bc.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-latent-variable-model.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-latent-variable-model.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-latent-variable-model.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-latent-variable-model.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-many-latents.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-many-latents.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-many-latents.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-many-latents.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-normalizing-flows.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-normalizing-flows.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-normalizing-flows.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-normalizing-flows.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-observation-action-mapping.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-observation-action-mapping.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-observation-action-mapping.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-observation-action-mapping.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-queues.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-queues.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-queues.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-queues.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch4/ch4-task-effect-on-pairs.png b/app/scripts/latex-to-mdx/input/figures/ch4/ch4-task-effect-on-pairs.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch4/ch4-task-effect-on-pairs.png
rename to app/scripts/latex-to-mdx/input/figures/ch4/ch4-task-effect-on-pairs.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch5/ch5-generalist-policies-timeline.png b/app/scripts/latex-to-mdx/input/figures/ch5/ch5-generalist-policies-timeline.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch5/ch5-generalist-policies-timeline.png
rename to app/scripts/latex-to-mdx/input/figures/ch5/ch5-generalist-policies-timeline.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch5/ch5-ml-vs-robotics-foundation.png b/app/scripts/latex-to-mdx/input/figures/ch5/ch5-ml-vs-robotics-foundation.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch5/ch5-ml-vs-robotics-foundation.png
rename to app/scripts/latex-to-mdx/input/figures/ch5/ch5-ml-vs-robotics-foundation.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch5/ch5-pi0-sampling-timesteps.png b/app/scripts/latex-to-mdx/input/figures/ch5/ch5-pi0-sampling-timesteps.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch5/ch5-pi0-sampling-timesteps.png
rename to app/scripts/latex-to-mdx/input/figures/ch5/ch5-pi0-sampling-timesteps.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch5/ch5-pi0.png b/app/scripts/latex-to-mdx/input/figures/ch5/ch5-pi0.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch5/ch5-pi0.png
rename to app/scripts/latex-to-mdx/input/figures/ch5/ch5-pi0.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch5/ch5-smolvla.png b/app/scripts/latex-to-mdx/input/figures/ch5/ch5-smolvla.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch5/ch5-smolvla.png
rename to app/scripts/latex-to-mdx/input/figures/ch5/ch5-smolvla.png
diff --git a/app/scripts/latex-to-markdown/input/figures/ch5/ch5-trends.png b/app/scripts/latex-to-mdx/input/figures/ch5/ch5-trends.png
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/ch5/ch5-trends.png
rename to app/scripts/latex-to-mdx/input/figures/ch5/ch5-trends.png
diff --git a/app/scripts/latex-to-markdown/input/figures/misc/lerobot-team.jpeg b/app/scripts/latex-to-mdx/input/figures/misc/lerobot-team.jpeg
similarity index 100%
rename from app/scripts/latex-to-markdown/input/figures/misc/lerobot-team.jpeg
rename to app/scripts/latex-to-mdx/input/figures/misc/lerobot-team.jpeg
diff --git a/app/scripts/latex-to-markdown/input/handles.tex b/app/scripts/latex-to-mdx/input/handles.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/handles.tex
rename to app/scripts/latex-to-mdx/input/handles.tex
diff --git a/app/scripts/latex-to-markdown/input/hfstyle/defns.tex b/app/scripts/latex-to-mdx/input/hfstyle/defns.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/hfstyle/defns.tex
rename to app/scripts/latex-to-mdx/input/hfstyle/defns.tex
diff --git a/app/scripts/latex-to-markdown/input/hfstyle/hf.cls b/app/scripts/latex-to-mdx/input/hfstyle/hf.cls
similarity index 100%
rename from app/scripts/latex-to-markdown/input/hfstyle/hf.cls
rename to app/scripts/latex-to-mdx/input/hfstyle/hf.cls
diff --git a/app/scripts/latex-to-markdown/input/hfstyle/manrope.sty b/app/scripts/latex-to-mdx/input/hfstyle/manrope.sty
similarity index 100%
rename from app/scripts/latex-to-markdown/input/hfstyle/manrope.sty
rename to app/scripts/latex-to-mdx/input/hfstyle/manrope.sty
diff --git a/app/scripts/latex-to-markdown/input/hfstyle/manrope/Manrope-Bold.ttf b/app/scripts/latex-to-mdx/input/hfstyle/manrope/Manrope-Bold.ttf
similarity index 100%
rename from app/scripts/latex-to-markdown/input/hfstyle/manrope/Manrope-Bold.ttf
rename to app/scripts/latex-to-mdx/input/hfstyle/manrope/Manrope-Bold.ttf
diff --git a/app/scripts/latex-to-markdown/input/hfstyle/manrope/Manrope-Regular.ttf b/app/scripts/latex-to-mdx/input/hfstyle/manrope/Manrope-Regular.ttf
similarity index 100%
rename from app/scripts/latex-to-markdown/input/hfstyle/manrope/Manrope-Regular.ttf
rename to app/scripts/latex-to-mdx/input/hfstyle/manrope/Manrope-Regular.ttf
diff --git a/app/scripts/latex-to-markdown/input/hfstyle/plainnat.bst b/app/scripts/latex-to-mdx/input/hfstyle/plainnat.bst
similarity index 100%
rename from app/scripts/latex-to-markdown/input/hfstyle/plainnat.bst
rename to app/scripts/latex-to-mdx/input/hfstyle/plainnat.bst
diff --git a/app/scripts/latex-to-markdown/input/hfstyle/template_content.tex b/app/scripts/latex-to-mdx/input/hfstyle/template_content.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/hfstyle/template_content.tex
rename to app/scripts/latex-to-mdx/input/hfstyle/template_content.tex
diff --git a/app/scripts/latex-to-markdown/input/main.bbl b/app/scripts/latex-to-mdx/input/main.bbl
similarity index 100%
rename from app/scripts/latex-to-markdown/input/main.bbl
rename to app/scripts/latex-to-mdx/input/main.bbl
diff --git a/app/scripts/latex-to-markdown/input/main.bib b/app/scripts/latex-to-mdx/input/main.bib
similarity index 100%
rename from app/scripts/latex-to-markdown/input/main.bib
rename to app/scripts/latex-to-mdx/input/main.bib
diff --git a/app/scripts/latex-to-markdown/input/main.dvi b/app/scripts/latex-to-mdx/input/main.dvi
similarity index 100%
rename from app/scripts/latex-to-markdown/input/main.dvi
rename to app/scripts/latex-to-mdx/input/main.dvi
diff --git a/app/scripts/latex-to-markdown/input/main.tex b/app/scripts/latex-to-mdx/input/main.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/main.tex
rename to app/scripts/latex-to-mdx/input/main.tex
diff --git a/app/scripts/latex-to-markdown/input/manropebold.tfm b/app/scripts/latex-to-mdx/input/manropebold.tfm
similarity index 100%
rename from app/scripts/latex-to-markdown/input/manropebold.tfm
rename to app/scripts/latex-to-mdx/input/manropebold.tfm
diff --git a/app/scripts/latex-to-markdown/input/manroperegular.tfm b/app/scripts/latex-to-mdx/input/manroperegular.tfm
similarity index 100%
rename from app/scripts/latex-to-markdown/input/manroperegular.tfm
rename to app/scripts/latex-to-mdx/input/manroperegular.tfm
diff --git a/app/scripts/latex-to-markdown/input/math_commands.tex b/app/scripts/latex-to-mdx/input/math_commands.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/math_commands.tex
rename to app/scripts/latex-to-mdx/input/math_commands.tex
diff --git a/app/scripts/latex-to-markdown/input/natbib.sty b/app/scripts/latex-to-mdx/input/natbib.sty
similarity index 100%
rename from app/scripts/latex-to-markdown/input/natbib.sty
rename to app/scripts/latex-to-mdx/input/natbib.sty
diff --git a/app/scripts/latex-to-markdown/input/preamble.tex b/app/scripts/latex-to-mdx/input/preamble.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/preamble.tex
rename to app/scripts/latex-to-mdx/input/preamble.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/00_abstract.tex b/app/scripts/latex-to-mdx/input/sections/00_abstract.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/00_abstract.tex
rename to app/scripts/latex-to-mdx/input/sections/00_abstract.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/01_introduction.tex b/app/scripts/latex-to-mdx/input/sections/01_introduction.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/01_introduction.tex
rename to app/scripts/latex-to-mdx/input/sections/01_introduction.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/02_classic_robotics.tex b/app/scripts/latex-to-mdx/input/sections/02_classic_robotics.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/02_classic_robotics.tex
rename to app/scripts/latex-to-mdx/input/sections/02_classic_robotics.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/03_reinforcement_learning.tex b/app/scripts/latex-to-mdx/input/sections/03_reinforcement_learning.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/03_reinforcement_learning.tex
rename to app/scripts/latex-to-mdx/input/sections/03_reinforcement_learning.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/04_imitation_learning.tex b/app/scripts/latex-to-mdx/input/sections/04_imitation_learning.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/04_imitation_learning.tex
rename to app/scripts/latex-to-mdx/input/sections/04_imitation_learning.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/05_foundation_models.tex b/app/scripts/latex-to-mdx/input/sections/05_foundation_models.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/05_foundation_models.tex
rename to app/scripts/latex-to-mdx/input/sections/05_foundation_models.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/05_foundation_models.tex.temp b/app/scripts/latex-to-mdx/input/sections/05_foundation_models.tex.temp
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/05_foundation_models.tex.temp
rename to app/scripts/latex-to-mdx/input/sections/05_foundation_models.tex.temp
diff --git a/app/scripts/latex-to-markdown/input/sections/06_next_directions.tex b/app/scripts/latex-to-mdx/input/sections/06_next_directions.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/06_next_directions.tex
rename to app/scripts/latex-to-mdx/input/sections/06_next_directions.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/07_conclusions.tex b/app/scripts/latex-to-mdx/input/sections/07_conclusions.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/07_conclusions.tex
rename to app/scripts/latex-to-mdx/input/sections/07_conclusions.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/A_foreword.tex b/app/scripts/latex-to-mdx/input/sections/A_foreword.tex
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/A_foreword.tex
rename to app/scripts/latex-to-mdx/input/sections/A_foreword.tex
diff --git a/app/scripts/latex-to-markdown/input/sections/test.md b/app/scripts/latex-to-mdx/input/sections/test.md
similarity index 100%
rename from app/scripts/latex-to-markdown/input/sections/test.md
rename to app/scripts/latex-to-mdx/input/sections/test.md
diff --git a/app/scripts/latex-to-markdown/input/snippets/01_1_datasets.py b/app/scripts/latex-to-mdx/input/snippets/01_1_datasets.py
similarity index 100%
rename from app/scripts/latex-to-markdown/input/snippets/01_1_datasets.py
rename to app/scripts/latex-to-mdx/input/snippets/01_1_datasets.py
diff --git a/app/scripts/latex-to-markdown/input/t1manrope.fd b/app/scripts/latex-to-mdx/input/t1manrope.fd
similarity index 100%
rename from app/scripts/latex-to-markdown/input/t1manrope.fd
rename to app/scripts/latex-to-mdx/input/t1manrope.fd
diff --git a/app/scripts/latex-to-markdown/latex-converter.mjs b/app/scripts/latex-to-mdx/latex-converter.mjs
similarity index 89%
rename from app/scripts/latex-to-markdown/latex-converter.mjs
rename to app/scripts/latex-to-mdx/latex-converter.mjs
index 9f57143b5757f7cd3d3431509a64521a88800784..7079e2e43b85e9947a771a33a9ef22adb329f35a 100644
--- a/app/scripts/latex-to-markdown/latex-converter.mjs
+++ b/app/scripts/latex-to-mdx/latex-converter.mjs
@@ -67,13 +67,23 @@ function preprocessLatexFile(inputFile, outputDir) {
     content = content.replace(/\\end\{equation\*\}\$\$/g, '$$');
     content = content.replace(/\\begin\{equation\*\}/g, '$$');
     content = content.replace(/\\end\{equation\*\}/g, '$$');
-    content = content.replace(/\\begin\{align\}/g, '$$');
-    content = content.replace(/\\end\{align\}/g, '$$');
+    // Keep align environments intact for KaTeX support
+    // Protect align environments by temporarily replacing them before cleaning & operators
+    const alignBlocks = [];
+    content = content.replace(/\\begin\{align\}([\s\S]*?)\\end\{align\}/g, (match, alignContent) => {
+        alignBlocks.push(match);
+        return `__ALIGN_BLOCK_${alignBlocks.length - 1}__`;
+    });
 
-    // Remove ALL alignment operators (&) from math content - purely cosmetic
+    // Now remove & operators from non-align content (outside align environments)
     content = content.replace(/&=/g, '=');
     content = content.replace(/&/g, '');
 
+    // Restore align blocks with their & operators intact
+    alignBlocks.forEach((block, index) => {
+        content = content.replace(`__ALIGN_BLOCK_${index}__`, block);
+    });
+
     // Convert LaTeX citations to Pandoc format
     content = content.replace(/\\cite[tp]?\{([^}]+)\}/g, (match, citations) => {
         // Handle multiple citations separated by commas - all become simple @citations
@@ -144,17 +154,27 @@ function preprocessLatexFile(inputFile, outputDir) {
                 return `\\text{${simplified}}`;
             });
 
-            // Remove alignment operators in included content too
+            // Apply same align-preserving logic to included content
+            const alignBlocksIncluded = [];
+            includedContent = includedContent.replace(/\\begin\{align\}([\s\S]*?)\\end\{align\}/g, (match, alignContent) => {
+                alignBlocksIncluded.push(match);
+                return `__ALIGN_BLOCK_${alignBlocksIncluded.length - 1}__`;
+            });
+
+            // Remove alignment operators from non-align content in included files
             includedContent = includedContent.replace(/&=/g, '=');
             includedContent = includedContent.replace(/&/g, '');
 
+            // Restore align blocks with their & operators intact
+            alignBlocksIncluded.forEach((block, index) => {
+                includedContent = includedContent.replace(`__ALIGN_BLOCK_${index}__`, block);
+            });
+
             // Convert math environments in included content
             includedContent = includedContent.replace(/\$\$\\begin\{equation\*\}/g, '$$');
             includedContent = includedContent.replace(/\\end\{equation\*\}\$\$/g, '$$');
             includedContent = includedContent.replace(/\\begin\{equation\*\}/g, '$$');
             includedContent = includedContent.replace(/\\end\{equation\*\}/g, '$$');
-            includedContent = includedContent.replace(/\\begin\{align\}/g, '$$');
-            includedContent = includedContent.replace(/\\end\{align\}/g, '$$');
 
             // Convert citations in included content
             includedContent = includedContent.replace(/\\cite[tp]?\{([^}]+)\}/g, (match, citations) => {
diff --git a/app/scripts/latex-to-markdown/mdx-converter.mjs b/app/scripts/latex-to-mdx/mdx-converter.mjs
similarity index 80%
rename from app/scripts/latex-to-markdown/mdx-converter.mjs
rename to app/scripts/latex-to-mdx/mdx-converter.mjs
index 35416a144a048bce821201600831308fdece576c..292027eabaa75fc18f34add9f2a688753a67fe6c 100644
--- a/app/scripts/latex-to-markdown/mdx-converter.mjs
+++ b/app/scripts/latex-to-mdx/mdx-converter.mjs
@@ -328,7 +328,6 @@ function fixHtmlEscaping(content) {
 
     let fixedCount = 0;
 
-    // Fix escaped HTML in anchor spans with various escaping patterns
     // Pattern 1: \<span id="..." style="..."\>\</span\>
     content = content.replace(/\\<span id="([^"]*)" style="([^"]*)"\\>\\<\/span\\>/g, (match, id, style) => {
         fixedCount++;
@@ -348,6 +347,26 @@ function fixHtmlEscaping(content) {
         return `<span class="${className}">${cleanText}</span>`;
     });
 
+    // Pattern 3: HTML-encoded spans in paragraph tags
+    // <p>&lt;span id="..." style="..."&gt;&lt;/span&gt;</p>
+    content = content.replace(/<p>&lt;span id="([^"]*)" style="([^"]*)"&gt;&lt;\/span&gt;<\/p>/g, (match, id, style) => {
+        fixedCount++;
+        // Fix common style issues like "position- absolute;" -> "position: absolute;"
+        const cleanStyle = style.replace('position- absolute;', 'position: absolute;');
+        return `<span id="${id}" style="${cleanStyle}"></span>`;
+    });
+
+    // Pattern 4: HTML-encoded spans with class in paragraph tags
+    // <p>&lt;span class="..."&gt;...&lt;/span&gt;</p>
+    content = content.replace(/<p>&lt;span class="([^"]*)"&gt;([^&]*)&lt;\/span&gt;<\/p>/g, (match, className, text) => {
+        fixedCount++;
+        // Remove numbering like (1), (2), (3) from highlight spans
+        let cleanText = text;
+        if (className === 'highlight') {
+            cleanText = text.replace(/^\(\d+\)\s*/, '');
+        }
+        return `<span class="${className}">${cleanText}</span>`;
+    });
 
     if (fixedCount > 0) {
         console.log(`    ✅ Fixed ${fixedCount} escaped span(s)`);
@@ -425,6 +444,115 @@ tableOfContentsAutoCollapse: true
     return content;
 }
 
+/**
+ * Fix mixed math delimiters like $`...`$ or `...`$
+ * @param {string} content - MDX content
+ * @returns {string} - Content with fixed math delimiters
+ */
+function fixMixedMathDelimiters(content) {
+    console.log('  🔧 Fixing mixed math delimiters...');
+
+    let fixedCount = 0;
+
+    // Fix patterns like $`...`$ (mixed delimiters)
+    content = content.replace(/\$`([^`]*)`\$/g, (match, mathContent) => {
+        fixedCount++;
+        return `$${mathContent}$`;
+    });
+
+    // Fix patterns like `...`$ (backtick start, dollar end)
+    content = content.replace(/`([^`]*)`\$/g, (match, mathContent) => {
+        fixedCount++;
+        return `$${mathContent}$`;
+    });
+
+    // Fix patterns like $`...` (dollar start, backtick end - less common)
+    content = content.replace(/\$`([^`]*)`(?!\$)/g, (match, mathContent) => {
+        fixedCount++;
+        return `$${mathContent}$`;
+    });
+
+    if (fixedCount > 0) {
+        console.log(`    ✅ Fixed ${fixedCount} mixed math delimiter(s)`);
+    }
+
+    return content;
+}
+
+/**
+ * Clean up orphaned math delimiters and fix mixed content
+ * @param {string} content - MDX content
+ * @returns {string} - Content with cleaned math blocks
+ */
+function cleanOrphanedMathDelimiters(content) {
+    console.log('  🧹 Cleaning orphaned math delimiters...');
+    console.log('    🔍 Content length:', content.length, 'chars');
+
+    let fixedCount = 0;
+
+    // Fix orphaned $$ that are alone on lines (but not part of display math blocks)
+    // Only remove $$ that appear alone without corresponding closing $$
+    content = content.replace(/^\$\$\s*$(?!\s*[\s\S]*?\$\$)/gm, () => {
+        fixedCount++;
+        return '';
+    });
+
+    // Fix backticks inside $$....$$ blocks (Pandoc artifact)
+    const mathMatches = content.match(/\$\$([\s\S]*?)\$\$/g);
+    console.log(`    🔍 Found ${mathMatches ? mathMatches.length : 0} math blocks`);
+
+    content = content.replace(/\$\$([\s\S]*?)\$\$/g, (match, mathContent) => {
+        // More aggressive: remove ALL single backticks in math blocks (they shouldn't be there)
+        let cleanedMath = mathContent;
+
+        // Count backticks before
+        const backticksBefore = (mathContent.match(/`/g) || []).length;
+
+        if (backticksBefore > 0) {
+            console.log(`    🔧 Found math block with ${backticksBefore} backtick(s)`);
+        }
+
+        // Remove all isolated backticks (not in pairs)
+        cleanedMath = cleanedMath.replace(/`/g, '');
+
+        const backticksAfter = (cleanedMath.match(/`/g) || []).length;
+
+        if (backticksBefore > 0) {
+            fixedCount++;
+            console.log(`    🔧 Removed ${backticksBefore} backtick(s) from math block`);
+            return `$$${cleanedMath}$$`;
+        }
+        return match;
+    });
+
+    // Fix escaped align in math blocks: \begin{align} -> \begin{align}
+    content = content.replace(/\\begin\{align\}/g, (match) => {
+        fixedCount++;
+        return '\\begin{align}';
+    });
+
+    content = content.replace(/\\end\{align\}/g, (match) => {
+        fixedCount++;
+        return '\\end{align}';
+    });
+
+    // Fix cases where text gets mixed with math blocks
+    // Pattern: ``` math ... ``` text ``` math 
+    content = content.replace(/``` math\s*\n([\s\S]*?)\n```\s*([^`\n]*?)\s*``` math/g, (match, math1, text, math2) => {
+        if (text.trim().length > 0 && !text.includes('```')) {
+            fixedCount++;
+            return '```' + ' math\n' + math1 + '\n```\n\n' + text.trim() + '\n\n```' + ' math';
+        }
+        return match;
+    });
+
+    if (fixedCount > 0) {
+        console.log(`    ✅ Fixed ${fixedCount} orphaned math delimiter(s)`);
+    }
+
+    return content;
+}
+
 /**
  * Clean newlines from single-dollar math blocks ($...$) ONLY
  * @param {string} content - MDX content
@@ -559,12 +687,11 @@ function cleanMdxSyntax(content) {
     console.log('  🧹 Cleaning MDX syntax...');
 
     return content
-        // Fix math delimiters
-        .replace(/\$`([^`]+)`\$/g, '$$$1$$')
+        // NOTE: Math delimiter fixing is now handled by fixMixedMathDelimiters()
         // Ensure proper spacing around JSX-like constructs
         .replace(/>\s*</g, '>\n<')
-        // Remove problematic heading attributes
-        .replace(/^(#{1,6}[^{]+)\{[^}]+\}$/gm, '$1')
+        // Remove problematic heading attributes - be more specific to avoid matching \begin{align}
+        .replace(/^(#{1,6}\s+[^{#\n]+)\{[^}]+\}$/gm, '$1')
         // Fix escaped quotes in text
         .replace(/\\("|')/g, '$1');
 }
@@ -586,6 +713,13 @@ function processMdxContent(content, latexContent = '') {
 
     // Apply each transformation step sequentially
     processedContent = ensureFrontmatter(processedContent, latexContent);
+    processedContent = fixMixedMathDelimiters(processedContent);
+
+    // Debug: check for $$ blocks after fixMixedMathDelimiters
+    const mathBlocksAfterMixed = (processedContent.match(/\$\$([\s\S]*?)\$\$/g) || []).length;
+    console.log(`    📊 Math blocks after mixed delimiters fix: ${mathBlocksAfterMixed}`);
+
+    processedContent = cleanOrphanedMathDelimiters(processedContent);
     processedContent = cleanSingleLineMathNewlines(processedContent);
     processedContent = formatDisplayMathBlocks(processedContent);
     processedContent = removeHtmlComments(processedContent);
diff --git a/app/scripts/latex-to-markdown/metadata-extractor.mjs b/app/scripts/latex-to-mdx/metadata-extractor.mjs
similarity index 100%
rename from app/scripts/latex-to-markdown/metadata-extractor.mjs
rename to app/scripts/latex-to-mdx/metadata-extractor.mjs
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch1/ch1-lerobot-figure1.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch1/ch1-lerobot-figure1.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch1/ch1-lerobot-figure1.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch1/ch1-lerobot-figure1.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-approaches.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-approaches.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-approaches.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-approaches.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-classical-limitations.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-classical-limitations.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-classical-limitations.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-classical-limitations.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-cost-accessibility.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-cost-accessibility.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-cost-accessibility.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-cost-accessibility.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-box.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-box.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-box.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-box.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-shelf.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-shelf.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-shelf.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-shelf.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-floor.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-floor.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-floor.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-floor.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-free.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-free.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-free.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-free.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-platforms.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-platforms.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-platforms.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-platforms.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-so100-to-planar-manipulator.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-so100-to-planar-manipulator.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-so100-to-planar-manipulator.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-so100-to-planar-manipulator.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-agent-env.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-agent-env.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-agent-env.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-agent-env.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-duck-sim-vs-real.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-duck-sim-vs-real.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-duck-sim-vs-real.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-duck-sim-vs-real.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-hil-serl-examples.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-hil-serl-examples.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-hil-serl-examples.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-hil-serl-examples.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-learning-atlas.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-learning-atlas.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-learning-atlas.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-learning-atlas.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-learning-benefits.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-learning-benefits.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-learning-benefits.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-learning-benefits.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-many-ducks.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-many-ducks.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-many-ducks.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-many-ducks.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-rl-algorithms-atlas.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-rl-algorithms-atlas.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-rl-algorithms-atlas.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-rl-algorithms-atlas.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-rl-examples.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-rl-examples.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-rl-examples.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-rl-examples.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-act-decoder.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-act-decoder.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-act-decoder.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-act-decoder.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-act-encoder.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-act-encoder.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-act-encoder.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-act-encoder.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-act.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-act.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-act.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-act.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-action-vs-observation-distribution.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-action-vs-observation-distribution.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-action-vs-observation-distribution.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-action-vs-observation-distribution.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-async-inference.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-async-inference.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-async-inference.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-async-inference.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-bc-trajectories.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-bc-trajectories.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-bc-trajectories.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-bc-trajectories.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-diffusion-policy.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-diffusion-policy.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-diffusion-policy.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-diffusion-policy.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-diffusion-robot-actions.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-diffusion-robot-actions.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-diffusion-robot-actions.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-diffusion-robot-actions.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-diffusion-vs-flowmatching.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-diffusion-vs-flowmatching.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-diffusion-vs-flowmatching.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-diffusion-vs-flowmatching.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-issues-with-bc.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-issues-with-bc.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-issues-with-bc.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-issues-with-bc.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-latent-variable-model.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-latent-variable-model.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-latent-variable-model.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-latent-variable-model.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-many-latents.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-many-latents.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-many-latents.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-many-latents.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-normalizing-flows.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-normalizing-flows.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-normalizing-flows.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-normalizing-flows.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-observation-action-mapping.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-observation-action-mapping.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-observation-action-mapping.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-observation-action-mapping.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-queues.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-queues.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-queues.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-queues.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-task-effect-on-pairs.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-task-effect-on-pairs.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-task-effect-on-pairs.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-task-effect-on-pairs.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-generalist-policies-timeline.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-generalist-policies-timeline.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-generalist-policies-timeline.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-generalist-policies-timeline.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-ml-vs-robotics-foundation.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-ml-vs-robotics-foundation.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-ml-vs-robotics-foundation.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-ml-vs-robotics-foundation.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-pi0-sampling-timesteps.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-pi0-sampling-timesteps.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-pi0-sampling-timesteps.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-pi0-sampling-timesteps.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-pi0.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-pi0.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-pi0.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-pi0.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-smolvla.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-smolvla.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-smolvla.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-smolvla.png
diff --git a/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-trends.png b/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-trends.png
similarity index 100%
rename from app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-trends.png
rename to app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-trends.png
diff --git a/app/scripts/latex-to-markdown/output/main.bib b/app/scripts/latex-to-mdx/output/main.bib
similarity index 100%
rename from app/scripts/latex-to-markdown/output/main.bib
rename to app/scripts/latex-to-mdx/output/main.bib
diff --git a/app/scripts/latex-to-markdown/output/main.md b/app/scripts/latex-to-mdx/output/main.md
similarity index 91%
rename from app/scripts/latex-to-markdown/output/main.md
rename to app/scripts/latex-to-mdx/output/main.md
index e004d496d0d2b622f0988ae2876c4e92412cb141..09244c795e617253e31bd48b79b77bd43a42c0de 100644
--- a/app/scripts/latex-to-markdown/output/main.md
+++ b/app/scripts/latex-to-mdx/output/main.md
@@ -19,7 +19,7 @@ We sincerely hope this tutorial serves as a valuable starting point for your jou
 ## Introduction
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch1/ch1-lerobot-figure1.png" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch1/ch1-lerobot-figure1.png" />
 <p>&lt;span id="figure1" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption><code>lerobot</code> is the open-source library for end-to-end robotics developed by Hugging Face. The library is vertically integrated on the entire robotics stack, supporting low-level control of real-world robot devices, advanced data and inference optimizations, as well as SOTA robot learning methods with simple implementations in pure Pytorch.</figcaption>
 </figure>
@@ -164,7 +164,7 @@ TL;DR Learning-based approaches to robotics are motivated by the need to (1) gen
 ### Explicit and Implicit Models
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-approaches.png" style="width:50.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-approaches.png" style="width:50.0%" />
 <p>&lt;span id="generating-motion-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Overview of methods to generate motion (clearly non-exhausitve, see @bekrisStateRobotMotion2024). The different methods can be grouped based on whether they explicitly (<em>dynamics-based</em>) or implicitly (<em>learning-based</em>) model robot-environment interactions.</figcaption>
 </figure>
@@ -176,7 +176,7 @@ Methods to produce robotics motion range from traditional *explicit* models--\<s
 ### Different Types of Motion
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-platforms.png" style="width-70.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-platforms.png" style="width-70.0%" />
 <p>&lt;span id="robotics-platforms-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Different kinds of motions are achieved with potentially very different robotic platforms. From left to right, top to bottom: ViperX, SO-100, Boston Dynamics’ Spot, Open-Duck, 1X’s NEO, Boston Dynamics’ Atlas. This is an example list of robotic platforms and is (very) far from being exhaustive.</figcaption>
 </figure>
@@ -194,7 +194,7 @@ Robot manipulators typically consist of a series of links and joints, articulate
 Recently, the development of low-cost manipulators like the ALOHA @zhaoLearningFineGrainedBimanual2023 ALOHA-2 @aldacoALOHA2Enhanced and SO-100/SO-101 @knightStandardOpenSO100 platforms significantly lowered the barrier to entry to robotics, considering the increased accessibility of these robots compared to more traditional platforms like the Franka Emika Panda arm (Figure <a href="#robotic-platforms-costs" data-reference-type="ref" data-reference="robotic-platforms-costs">[robotic-platforms-costs]</a>).
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-cost-accessibility.png" style="width-40.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-cost-accessibility.png" style="width-40.0%" />
 <p>&lt;span id="robotic-platforms-costs" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Cheaper, more accessible robots are starting to rival traditional platforms like the Panda arm platforms in adoption in resource-constrained scenarios. The SO-100, in particular, has a cost in the 100s of Euros, and can be entirely 3D-printed in hours, while the industrially-manufactured Panda arm costs tens of thousands of Euros and is not openly available.</figcaption>
 </figure>
@@ -202,7 +202,7 @@ Recently, the development of low-cost manipulators like the ALOHA @zhaoLearning
 Deriving an intuition as per why learning-based approaches are gaining popularity in the robotics community requires briefly analyzing traditional approaches for manipulation, leveraging tools like forward and inverse kinematics (FK, IK) and control theory. Providing a detailed overview of these methods falls (well) out of the scope of this tutorial, and we refer the reader to works including @sicilianoSpringerHandbookRobotics2016, @lynchModernRoboticsMechanics2017, @tedrakeRoboticManipulationPerception, @tedrakeUnderactuatedRoboticsAlgorithms for a much more comprehensive description of these techniques. Here, we mostly wish to highlight the benefits of ML over these traditional techniques
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-so100-to-planar-manipulator.png" style="width:70.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-so100-to-planar-manipulator.png" style="width:70.0%" />
 <p>&lt;span id="make-so100-planar-manipulator" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>The SO-100 arm is a 6-dof manipulator arm. Preventing some of its joints (shoulder pane, wrist flex and wrist roll) from actuating, it can be represented as a traditional 2-dof planar manipulator (the gripper joint in the end-effector is not considered towards the count of the degrees of freedom used to produce motion).</figcaption>
 </figure>
@@ -215,44 +215,45 @@ All these simplifying assumptions leave us with the planar manipulator of Figure
 
 <figure>
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-free.png" style="height-3.2cm" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-free.png" style="height-3.2cm" />
 <p>&lt;span id="planar-manipulation-simple" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Free to move</figcaption>
 </figure>
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-floor.png" style="height:3.2cm" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-floor.png" style="height:3.2cm" />
 <p>&lt;span id="planar-manipulator-floor" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Constrained by the surface</figcaption>
 </figure>
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-shelf.png" style="height:3.2cm" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-shelf.png" style="height:3.2cm" />
 <p>&lt;span id="planar-manipulator-floor-shelf" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Constrained by surface and (fixed) obstacle</figcaption>
 </figure>
 <figcaption>Planar, 2-dof schematic representation of the SO-100 manipulator under diverse deployment settings. From left to right: completely free of moving; constrained by the presence of the surface; constrained by the surface and presence of obstacles. Circular arrows around each joint indicate the maximal rotation feasible at that joint.</figcaption>
 </figure>
 
-Considering the (toy) example presented in Figure <a href="#planar-manipulation-simple" data-reference-type="ref" data-reference="planar-manipulation-simple">[planar-manipulation-simple]</a>, then we can analytically write the end-effector’s position $`p \in \mathbb R^2`$ as a function of the robot’s configuration, $`p = p(q), p: \mathcal Q \mapsto \mathbb R^2`$. In particular, we have: 
-$$
-`p(q) = 
+Considering the (toy) example presented in Figure <a href="#planar-manipulation-simple" data-reference-type="ref" data-reference="planar-manipulation-simple">[planar-manipulation-simple]</a>, then we can analytically write the end-effector’s position $`p \in \mathbb R^2`$ as a function of the robot’s configuration, $`p = p(q), p: \mathcal Q \mapsto \mathbb R^2`$. In particular, we have: $`p(q) = 
 \begin{pmatrix}
-p_x(\theta_1, \theta_2)\\
-    p_y(\theta_1, \theta_2)
+p_x(\theta_1, \theta_2) \\  
+p_y(\theta_1, \theta_2)
 \end{pmatrix}
 =
 \begin{pmatrix}
-l \cos(\theta_1) + l \cos(\theta_1 + \theta_2)\\
-    l \sin(\theta_1) + l \sin(\theta_1 + \theta_2)
+l \cos(\theta_1) + l \cos(\theta_1 + \theta_2) \\
+l \sin(\theta_1) + l \sin(\theta_1 + \theta_2)
 \end{pmatrix}
-\in S^{n=2}_{l_1+l_2} = \{ p(q) \in \mathbb R^2: \Vert p(q) \Vert_2^2 \leq (2l)^2, \ \forall q \in \mathcal Q \}`
-$$
-
+\in S^{n=2}_{l_1+l_2} = \{ p(q) \in \mathbb R^2: \Vert p(q) \Vert_2^2 \leq (2l)^2, \ \forall q \in \mathcal Q \}`$
 
 Deriving the end-effector’s *pose*--position *and* orientation--in some $`m`$-dimensional space $`\boldsymbol{p} \in \mathcal{P} \subset \mathbb{R}^{m}`$ starting from the configuration $`{\textnormal{q}}\in \mathcal Q \subset \mathbb R^n`$ of a $`n`$-joints robot is referred to as *forward kinematics* (FK), whereas identifying the configuration corresponding to any given target pose is termed *inverse kinematics* (IK). In that, FK is used to map a robot configuration into the corresponding end-effector pose, whereas IK is used to reconstruct the configuration(s) given an end-effector pose.
 
 In the simplified case here considered (for which $`\boldsymbol{p} \equiv p`$, as the orientation of the end-effector is disregarded for simplicity), one can solve the problem of controlling the end-effector’s location to reach a goal position $`p^*`$ by solving analytically for $`q: p(q) = f_{\text{FK}}(q) = p^*`$. However, in the general case, one might not be able to solve this problem analytically, and can typically resort to iterative optimization methods comparing candidate solutions using a loss function (in the simplest case, $`\Vert p(q) - p^* \Vert_2^2`$ is a natural candidate), yielding:
 
-$`\htmlId{ik_problem}{\min_{q \in \mathcal Q} \Vert p(q) - p^* \Vert_2^2 \, .}`$
+``` math
+\begin{align}
+\min_{q \in \mathcal Q} \Vert p(q) - p^* \Vert_2^2 \, .
+
+\end{align}
+```
 
 Exact analytical solutions to IK are even less appealing when one considers the presence of obstacles in the robot’s workspace, resulting in constraints on the possible values of $`q \in \mathcal Q \subseteq [-\pi, +\pi]^n \subset \mathbb R^n`$ in the general case of $`n`$-links robots.
 
@@ -260,7 +261,13 @@ For instance, the robot in Figure <a href="#planar-manipulator-floor" data-refe
 
 However, IK--solving eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a> for a feasible $`q`$--only proves useful in determining information regarding the robot’s configuration in the goal pose, and crucially does not provide information on the *trajectory* to follow over time to reach a target pose. Expert-defined trajectories obviate to this problem providing a length-$`K`$ succession of goal poses $`\tau_K = [p^*_0, p^*_1, \dots p^*_K]`$ for tracking. In practice, trajectories can also be obtained automatically through *motion planning* algorithms, thus avoiding expensive trajectory definition from human experts. However, tracking $`\tau_K`$ via IK can prove prohibitively expensive, as tracking would require $`K`$ resolutions of eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a> (one for each target pose). *Differential* inverse kinematics (diff-IK) complements IK via closed-form solution of a variant of eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a>. Let $`J(q)`$ denote the Jacobian matrix of (partial) derivatives of the FK-function $`f_\text{FK}- \mathcal Q \mapsto \mathcal P`$, such that $`J(q) = \frac{\partial f_{FK}(q)}{\partial q }`$. Then, one can apply the chain rule to any $`p(q) = f_{\text{FK}}(q)`$, deriving $`\dot p = J(q) \dot q`$, and thus finally relating variations in the robot configurations to variations in pose, thereby providing a platform for control.
 
-Given a desired end-effector trajectory $`\dot {p}^*(t)`$ (1) indicating anchor regions in space and (2) how much time to spend in each region, diff-IK finds $`\dot q(t)`$ solving for joints’ *velocities* instead of *configurations*, $`\htmlId{reg_ik_velocity}{\dot q(t) = \arg\min_\nu \; \lVert J(q(t)) \nu - \dot {p}^*(t) \rVert_2^2}`$
+Given a desired end-effector trajectory $`\dot {p}^*(t)`$ (1) indicating anchor regions in space and (2) how much time to spend in each region, diff-IK finds $`\dot q(t)`$ solving for joints’ *velocities* instead of *configurations*,
+``` math
+\begin{align}
+\dot q(t) = \arg\min_\nu \; \lVert J(q(t)) \nu - \dot {p}^*(t) \rVert_2^2
+
+\end{align}
+```
 
 Unlike eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a>, solving for $`\dot q`$ is much less dependent on the environment (typically, variations in velocity are constrained by physical limits on the actuators). Conveniently, eq. <a href="#reg_ik_velocity" data-reference-type="ref" data-reference="reg_ik_velocity">[reg_ik_velocity]</a> also often admits the closed-form solution $`\dot q = J(q)^+ \dot {p}^*`$, where $`J^+(q)`$ denotes the Moore-Penrose pseudo-inverse of $`J(q)`$. Finally, discrete-time joint configurations $`q`$ can be reconstructed from joint velocities $`\dot q`$ using forward-integration on the continuous-time joint velocity , $`q_{t+1} = q_t + \Delta t\,\dot q_t`$ for a given $`\Delta t`$, resulting in tracking via diff-IK.
 
@@ -272,7 +279,7 @@ While very effective when a goal trajectory has been well specified, the perform
 
 <div class="wrapfigure">
 
-r0.3 <img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-box.png" alt="image" />
+r0.3 <img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-planar-manipulator-floor-box.png" alt="image" />
 
 \<span id="planar-manipulator-box-velocity" style="position- absolute;"\>\</span\>
 
@@ -293,7 +300,7 @@ We point the interested reader to , , and  for extended coverage of FK, IK, di
 Despite the last 60+ years of robotics research, autonomous robots are still largely incapable of performing tasks at human-level performance in the physical world generalizing across (1) robot embodiments (different manipulators, different locomotion platforms, etc.) and (2) tasks (tying shoe-laces, manipulating a diverse set of objects). While essential in the early development of robotics, the aforementioned methods require significant human expertise to be used in practice, and are typically specific to a particular applicative problem.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch2/ch2-classical-limitations.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch2/ch2-classical-limitations.png" style="width:90.0%" />
 <p>&lt;span id="classical-limitations" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Dynamics-based approaches to robotics suffer from several limitations: (1) orchestrating multiple components poses integration challenges; (2) the need to develop custom processing pipelines for the sensing modalities and tasks considered hinders scalability; (3) simplified analytical models of physical phenomena (here friction at the gripper; credits to @antonovaReinforcementLearningPivoting2017) limit real-world performance. Lastly, (4) dynamics-based methods overlook trends in the availability and growth of robotics data.</figcaption>
 </figure>
@@ -327,7 +334,7 @@ TL;DR The need for expensive high-fidelity simulators can be obviated by learnin
 </div>
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-learning-benefits.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-learning-benefits.png" style="width:90.0%" />
 <p>&lt;span id="robot-learning-upsides" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Learning-based robotics streamlines perception-to-action by learning a (1) unified high-level controller capable to take (2) high-dimensional, unstructured sensorimotor information. Learning (3) does not require a dynamics model and instead focuses on interaction data, and (4) empirically correlates with the scale of the data used. </figcaption>
 </figure>
@@ -337,7 +344,7 @@ Learning-based techniques for robotics naturally address the limitations present
 Being a field at its relative nascent stages, no prevalent technique(s) proved distinctly better better in robot learning. Still, two major classes of methods gained prominence- \<span class="highlight"\>reinforcement learning (RL)\</span\> and \<span class="highlight"\>Behavioral Cloning (BC)\</span\> (Figure <a href="#robot-learning-atlas" data-reference-type="ref" data-reference="robot-learning-atlas">[robot-learning-atlas]</a>). In this section, we provide a conceptual overview of applications of the former to robotics, as well as introduce practical examples of how to use RL within `lerobot`. We then introduce the major limitations RL suffers from, to introduce BC techniques in the next sections (<a href="#learning-bc-single-sec-learning-bc-generalist" data-reference-type="ref" data-reference="learning-bc-single-sec-learning-bc-generalist">[learning-bc-single-sec-learning-bc-generalist]</a>).
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-learning-atlas.png" style="width-50.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-learning-atlas.png" style="width-50.0%" />
 <p>&lt;span id="robot-learning-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Overview of the robot learning methods implemented in <code>lerobot</code>.</figcaption>
 </figure>
@@ -347,7 +354,7 @@ In Figure <a href="#robot-learning-atlas" data-reference-type="ref" data-refere
 Figure <a href="#robot-learning-atlas" data-reference-type="ref" data-reference="robot-learning-atlas">[robot-learning-atlas]</a> illustrates this categorization graphically, explicitly listing all the robot learning policies currently available in `lerobot`- Action Chunking with Transformers (ACT) @zhaoLearningFineGrainedBimanual2023, Diffusion Policy @chiDiffusionPolicyVisuomotor2024, Vector-Quantized Behavior Transformer (VQ-BeT) @leeBehaviorGenerationLatent2024, $`\pi_0`$ @blackp0VisionLanguageActionFlow2024, SmolVLA @shukorSmolVLAVisionLanguageActionModel2025, Human-in-the-loop Sample-efficient RL (HIL-SERL) @luoPreciseDexterousRobotic2024 and TD-MPC @hansenTemporalDifferenceLearning2022.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-rl-examples.png" style="width:80.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-rl-examples.png" style="width:80.0%" />
 <p>&lt;span id="robotics-with-rl-examples" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Examples of two different robotics tasks performed using RL. In the manipulation task (A) an agent learns to reach for a yellow plastic block in its environment, and to put it inside of a box. In the locomotion task (B) an agent learns to move its center of mass sideways without falling.</figcaption>
 </figure>
@@ -359,7 +366,7 @@ Applications of RL to robotics have been long studied, to the point the relation
 The RL framework @suttonReinforcementLearningIntroduction2018, which we briefly introduce here, has often been used to model robotics problems @koberReinforcementLearningRobotics. RL is a subfield within ML fundamentally concerned with the development of autonomous systems (*agents*) learning how to *continuously behave* in an evolving environment, developing (ideally, well-performing) control strategies (*policies*). Crucially for robotics, RL agents can improve via trial-and-error only, thus entirely bypassing the need to develop explicit models of the problem dynamics, and rather exploiting interaction data only. In RL, this feedback loop (Figure <a href="#rl-most-famous-pic" data-reference-type="ref" data-reference="rl-most-famous-pic">[rl-most-famous-pic]</a>) between actions and outcomes is established through the agent sensing a scalar quantity (*reward*).
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-agent-env.png" style="width:50.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-agent-env.png" style="width:50.0%" />
 <p>&lt;span id="rl-most-famous-pic" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Agent-Environment interaction diagram (image credits to @suttonReinforcementLearningIntroduction2018).</figcaption>
 </figure>
@@ -382,12 +389,14 @@ A length-$`T`$ *trajectory* is the (random) sequence
 ``` math
 \htmlId{trajectory_definition}{\tau = (s_0, a_0, r_0, s_1, a_1, r_1, \dots, s_{T-1}, a_{T-1}, r_{T-1}, s_T),}
 ```
-with per-step rewards defined as $`r_t = r (s_t, a_t, s_{t+1})`$ for ease of notation.Interestingly, assuming both the environment dynamics and conditional distribution over actions given states--the *policy*--to be *Markovian*: 
-$$
-`\htmlId{dynamics_markovian}{\mathbb P(s_{t+1}\vert s_t, a_t, s_{t-1}, a_{t-1}, \dots s_0, a_0 ) = \mathbb P (s_{t+1}\vert s_t, a_t)\\
-    \mathbb P(a_t\vert s_t, a_{t-1}, s_{t-1}, s_0, a_0) = \mathbb P(a_t\vert s_t)}`
-$$
- The probability of observing a given trajectory $`\tau`$ factorizes into
+with per-step rewards defined as $`r_t = r (s_t, a_t, s_{t+1})`$ for ease of notation.Interestingly, assuming both the environment dynamics and conditional distribution over actions given states--the *policy*--to be *Markovian*:
+``` math
+\begin{align}
+\mathbb P(s_{t+1}\vert s_t, a_t, s_{t-1}, a_{t-1}, \dots s_0, a_0 ) &= \mathbb P (s_{t+1}\vert s_t, a_t) \\
+\mathbb P(a_t\vert s_t, a_{t-1}, s_{t-1}, s_0, a_0) &= \mathbb P(a_t\vert s_t) 
+\end{align}
+```
+The probability of observing a given trajectory $`\tau`$ factorizes into
 ``` math
 \htmlId{traj_prob}{\mathbb P(\tau) = \mathbb P (s_0) \prod_{t=0}^{T-1} \mathbb P (s_{t+1}\vert s_t, a_t)\ \mathbb P(a_t\vert s_t).}
 ```
@@ -396,12 +405,13 @@ Policies $`\mathbb P(a_t\vert s_t)`$ are typically indicated as $`\pi(a_t\vert s
 ``` math
 G(\tau) = \sum_{t=0}^{T-1} \gamma^{t} r_t.
 ```
-In that, agents seek to learn control strategies (*policies*, $`\pi_\theta`$) maximizing the expected return $`\mathbb E_{\tau \sim \pi_\theta} G(\tau)`$. For a given dynamics $`\mathcal D`$--i.e., for a given problem--taking the expectation over the (possibly random) trajectories resulting from acting according to a certain policy provides a direct, goal-conditioned ordering in the space of all the possible policies $`\Pi`$, yielding the (maximization) target $`J : \Pi \mapsto \mathbb R`$ 
-$$
-`\htmlId{RL-j-function}{J(\pi_\theta) = \mathbb E_{\tau \sim \mathbb P_{\theta; \mathcal D}} [G(\tau)],\\
-    \mathbb P_{\theta; \mathcal D} (\tau) = \rho \prod_{t=0}^{T-1} \mathcal D (s_t, a_t, s_{t+1})\ \pi_\theta (a_t\vert s_t).}`
-$$
-
+In that, agents seek to learn control strategies (*policies*, $`\pi_\theta`$) maximizing the expected return $`\mathbb E_{\tau \sim \pi_\theta} G(\tau)`$. For a given dynamics $`\mathcal D`$--i.e., for a given problem--taking the expectation over the (possibly random) trajectories resulting from acting according to a certain policy provides a direct, goal-conditioned ordering in the space of all the possible policies $`\Pi`$, yielding the (maximization) target $`J : \Pi \mapsto \mathbb R`$
+``` math
+\begin{align}
+    J(\pi_\theta) &= \mathbb E_{\tau \sim \mathbb P_{\theta; \mathcal D}} [G(\tau)],  \\
+    \mathbb P_{\theta; \mathcal D} (\tau) &= \rho \prod_{t=0}^{T-1} \mathcal D (s_t, a_t, s_{t+1})\ \pi_\theta (a_t\vert s_t).
+\end{align}
+```
 
 Because in the RL framework the agent is assumed to only be able to observe the environment dynamics and not to intervene on them, <a href="#RL-j-function" data-reference-type="ref" data-reference="RL-j-function">[RL-j-function]</a> varies exclusively with the policy followed. In turn, MDPs naturally provide a framework to optimize over the space of the possible behaviors an agent might enact ($`\pi \in \Pi`$), searching for the *optimal policy* $`\pi^* = \arg \max_{\theta} J(\pi_\theta)`$, where $`\theta`$ is the parametrization adopted by the policy set $`\Pi: \pi_\theta \in \Pi, \ \forall \theta`$. Other than providing a target for policy search, $`G(\tau)`$ can also be used as a target to discriminate between states and state-action pairs. Given any state $`s \in \mathcal S`$--e.g., a given configuration of the robot--the *state-value* function
 ``` math
@@ -411,15 +421,18 @@ can be used to discriminate between desirable and undesirable state in terms of
 ``` math
 Q_\pi(s,a) = \mathbb E_{\tau \sim \pi} [G (\tau) \big \vert s_0 = s, a_0=a]
 ```
-Crucially, value functions are interrelated: 
-$$
-`\htmlId{q-as-v}{Q_\pi(s_t, a_t) = \mathbb{E}_{s_{t+1}\sim \mathbb P(\bullet \vert s_t, a_t)} [r_t + \gamma V_\pi(s_{t+1})]\\
-    V_\pi(s_t) = \mathbb E_{a_t\sim \pi(\bullet \vert s_t)} [Q_\pi (s_t, a_t)]}`
-$$
- Inducing an ordering over states and state-action pairs under $`\pi`$, value functions are central to most RL algorithms. A variety of methods have been developed in RL as standalone attemps to find (approximate) solutions to the problem of maximizing cumulative reward (Figure <a href="#rl-algos-atlas" data-reference-type="ref" data-reference="rl-algos-atlas">[rl-algos-atlas]</a>).
+Crucially, value functions are interrelated:
+``` math
+\begin{align}
+Q_\pi(s_t, a_t) &= \mathbb{E}_{s_{t+1}\sim \mathbb P(\bullet \vert s_t, a_t)} [r_t + \gamma V_\pi(s_{t+1})]  \\
+V_\pi(s_t) &= \mathbb E_{a_t\sim \pi(\bullet \vert s_t)} [Q_\pi (s_t, a_t)]
+
+\end{align}
+```
+Inducing an ordering over states and state-action pairs under $`\pi`$, value functions are central to most RL algorithms. A variety of methods have been developed in RL as standalone attemps to find (approximate) solutions to the problem of maximizing cumulative reward (Figure <a href="#rl-algos-atlas" data-reference-type="ref" data-reference="rl-algos-atlas">[rl-algos-atlas]</a>).
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-rl-algorithms-atlas.png" style="width-40.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-rl-algorithms-atlas.png" style="width-40.0%" />
 <p>&lt;span id="rl-algos-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Popular RL algorithms. See @SpinningUp2018 for a complete list of citations.</figcaption>
 </figure>
@@ -435,7 +448,7 @@ First, especially early in training, \<span class="highlight"\>actions are typic
 Second, learning with a limited number of samples remains problematic in RL, \<span class="highlight"\>limiting the applicability of RL in real-world robotics due to consequently prohibitive timescales of training\</span\>. Even strong algorithms such as SAC @haarnojaSoftActorCriticOffPolicy2018 typically require a large numbers of transitions $`\{ (s_t, a_t, r_t, s_{t+1})\}_{t=1}^N`$. On hardware, generating these data is time-consuming and can even be prohibitive.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-duck-sim-vs-real.png" style="width:70.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-duck-sim-vs-real.png" style="width:70.0%" />
 <p>&lt;span id="synthetic-vs-real-duck" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Simulated (left) vs. real-world (right) OpenDuck. Discrepancies in the simulation dynamics (<em>reality gap</em>) pose risks to policy transfer.</figcaption>
 </figure>
@@ -443,7 +456,7 @@ Second, learning with a limited number of samples remains problematic in RL, \<s
 Training RL policies in simulation @tobinDomainRandomizationTransferring2017 addresses both issues: it eliminates physical risk and dramatically increases throughput. Yet, simulators require significant modeling effort, and rely on assumptions (simplified physical modeling, instantaneous actuation, static environmental conditions, etc.) limiting transferring policies learned in simulation due the discrepancy between real and simulated environments (*reality gap*, Figure <a href="#synthetic-vs-real-duck" data-reference-type="ref" data-reference="synthetic-vs-real-duck">[synthetic-vs-real-duck]</a>). *Domain randomization* (DR) is a popular technique to overcome the reality gap, consisting in randomizing parameters of the simulated environment during training, to induce robustness to specific disturbances. In turn, DR is employed to increase the diversity of scenarios over the course of training, improving on the chances sim-to-real transfer @akkayaSolvingRubiksCube2019, @antonovaReinforcementLearningPivoting2017, @jiDribbleBotDynamicLegged2023. In practice, DR is performed further parametrizing the *simulator*’s dynamics $`\mathcal D \equiv \mathcal D_\xi`$ with a *dynamics* (random) vector $`\xi`$ drawn an arbitrary distribution, $`\xi \sim \Xi`$. Over the course of training--typically at each episode’s reset--a new $`\xi`$ is drawn, and used to specify the environment’s dynamics for that episode. For instance, one could decide to randomize the friction coefficient of the surface in a locomotion task (Figure <a href="#ducks-on-terrains" data-reference-type="ref" data-reference="ducks-on-terrains">[ducks-on-terrains]</a>), or the center of mass of an object for a manipulation task.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-many-ducks.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-many-ducks.png" style="width:90.0%" />
 <p>&lt;span id="ducks-on-terrains" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>The same locomotion task can be carried out in different (simulated) domains (exemplified by the difference in terrains) at training time, resulting to increased robustness over diverse environment dynamics.</figcaption>
 </figure>
@@ -479,15 +492,17 @@ Q_{i+1}(s_t, a_t) \leftarrow \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t
 ```
 Then, one can derive the (ideally, near-optimal) policy by explicitly maximizing over the action space the final (ideally, near-optimal) estimate $`Q_K \approx Q^*`$ at each timestep. In fact, under certain assumptions on the MDP considered, $`Q_K \to Q^* \, \text{as } K \to \infty`$.
 
-Effective in its early applications to small-scale discrete problems and theoretically sound, vanilla Q-learning was found complicated to scale to large $`\mathcal S\times \mathcal A`$ problems, in which the storing of $`Q : \mathcal S\times \mathcal A\mapsto \mathbb R`$ alone might result prohibitive. Also, vanilla Q-learning is not directly usable for *continuous*, unstructured state-action space MPDs, such as those considered in robotics. In their seminal work on *Deep Q-Learning* (DQN), @mnihPlayingAtariDeep2013 propose learning Q-values using deep convolutional neural networks, thereby accomodating for large and even unstructured *state* spaces. DQN parametrizes the Q-function using a neural network with parameters $`\theta`$, updating the parameters by sequentially minimizing the expected squared temporal-difference error (TD-error, $`\delta_i`$): 
-$$
-`\htmlId{dqn-loss}{\mathcal L(\theta_i) = \mathbb E_{(s_t, a_t) \sim \chi(\bullet)} 
+Effective in its early applications to small-scale discrete problems and theoretically sound, vanilla Q-learning was found complicated to scale to large $`\mathcal S\times \mathcal A`$ problems, in which the storing of $`Q : \mathcal S\times \mathcal A\mapsto \mathbb R`$ alone might result prohibitive. Also, vanilla Q-learning is not directly usable for *continuous*, unstructured state-action space MPDs, such as those considered in robotics. In their seminal work on *Deep Q-Learning* (DQN), @mnihPlayingAtariDeep2013 propose learning Q-values using deep convolutional neural networks, thereby accomodating for large and even unstructured *state* spaces. DQN parametrizes the Q-function using a neural network with parameters $`\theta`$, updating the parameters by sequentially minimizing the expected squared temporal-difference error (TD-error, $`\delta_i`$):
+``` math
+\begin{align}
+\mathcal L(\theta_i) &= \mathbb E_{(s_t, a_t) \sim \chi(\bullet)} 
     \big[ 
         (\underbrace{y_i - Q_{\theta_i}(s_t, a_t)}_{\delta_i})^2 
-    \big],\\
-    y_i = \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t, a_t)} \big[ r_t + \gamma \max_{a_t\in \mathcal A} Q_{\theta_{i-1}} (s_{t+1}, a_{t+1}) \big],}`
-$$
- Where $`\chi`$ represents a behavior distribution over state-action pairs. Crucially, $`\chi`$ can in principle be different from the policy being followed, effectively allowing to reuse prior data stored in a *replay buffer* in the form of $`(s_t, a_t, r_t, s_{t+1})`$ transitions, used to form the TD-target $`y_i`$, TD-error $`\delta_i`$ and loss function <a href="#dqn-loss" data-reference-type="ref" data-reference="dqn-loss">[dqn-loss]</a> via Monte-Carlo (MC) estimates.
+    \big],  \\
+    y_i &= \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t, a_t)} \big[ r_t + \gamma \max_{a_t\in \mathcal A} Q_{\theta_{i-1}} (s_{t+1}, a_{t+1}) \big], 
+\end{align}
+```
+Where $`\chi`$ represents a behavior distribution over state-action pairs. Crucially, $`\chi`$ can in principle be different from the policy being followed, effectively allowing to reuse prior data stored in a *replay buffer* in the form of $`(s_t, a_t, r_t, s_{t+1})`$ transitions, used to form the TD-target $`y_i`$, TD-error $`\delta_i`$ and loss function <a href="#dqn-loss" data-reference-type="ref" data-reference="dqn-loss">[dqn-loss]</a> via Monte-Carlo (MC) estimates.
 
 While effective in handling large, unstructured state spaces for discrete action-space problems, DQN application’s to continous control problems proved challenging. Indeed, in the case of high-capacity function approximators such as neural networks, solving $`\max_{a_t \in \mathcal A} Q_\theta(s_t, a_t)`$ at each timestep is simply unfeasible due to the (1) continous nature of the action space ($`\mathcal A\subset \mathbb R^n`$ for some $`n`$) and (2) impossibility to express the find a cheap (ideally, closed-form) solution to $`Q_\theta`$.  @silverDeterministicPolicyGradient2014 tackle this fundamental challenge by using a *deterministic* function of the state $`s_t`$ as policy, $`\mu_\phi(s_t) = a_t`$, parametrized by $`\phi`$. Thus, policies can be iteratively refined updating $`\phi`$ along the direction:
 ``` math
@@ -499,7 +514,13 @@ Provably, <a href="#deterministic-pg" data-reference-type="ref" data-reference="
 ```
 Similarily to DQN, DDPG also employs the same replay buffer mechanism, to reuse past transitions over training for increased sample efficiency and estimate the loss function via MC-estimates.
 
-Soft Actor-Critic (SAC) @haarnojaSoftActorCriticOffPolicy2018 is a derivation of DDPG in the max-entropy (MaxEnt) RL framework, in which RL agents are tasked with \<span class="highlight"\>maximizing the discounted cumulative reward, while acting as randomly as possible\</span\>. MaxEnt RL @haarnojaReinforcementLearningDeep2017 has proven particularly robust thanks to the development of diverse behaviors, incentivized by its entropy-regularization formulation. In that, MaxEnt revisits the RL objective $`J (\pi)`$ to specifically account for the policy entropy, $`\htmlId{J-soft}{J(\pi) = \sum_{t=0}^T \mathbb{E}_{(s_t, a_t) \sim \chi} [r_t + \alpha \mathcal H(\pi (\bullet \vert s_t))]}`$ This modified objective results in the *soft* TD-target:
+Soft Actor-Critic (SAC) @haarnojaSoftActorCriticOffPolicy2018 is a derivation of DDPG in the max-entropy (MaxEnt) RL framework, in which RL agents are tasked with \<span class="highlight"\>maximizing the discounted cumulative reward, while acting as randomly as possible\</span\>. MaxEnt RL @haarnojaReinforcementLearningDeep2017 has proven particularly robust thanks to the development of diverse behaviors, incentivized by its entropy-regularization formulation. In that, MaxEnt revisits the RL objective $`J (\pi)`$ to specifically account for the policy entropy,
+``` math
+\begin{align}
+    J(\pi) &= \sum_{t=0}^T \mathbb{E}_{(s_t, a_t) \sim \chi} [r_t + \alpha \mathcal H(\pi (\bullet \vert s_t))] 
+\end{align}
+```
+This modified objective results in the *soft* TD-target:
 ``` math
 \htmlId{soft-td-target}{y_i = \mathbb E_{s_{t+1} \sim \mathbb P( \bullet \vert s_t, a_t)} [r_t + \gamma \left( Q_{\theta_{i-1}} (s_{t+1}, a_{t+1}) - \alpha \log \pi_\phi(a_{t+1} \vert s_{t+1}) \right)], \quad a_{t+1} \sim \pi_\phi(\bullet \vert s_t)}
 ```
@@ -522,7 +543,7 @@ Despite the possibility to leverage offline data for learning, the effectiveness
 Lastly, in order to improve on the robustness of their approach to different goals while maintaing practical scalability, @luoSERLSoftwareSuite2025 introduced a modified state and action space, expressing proprioperceptive configurations $`q`$ and actions $`\dot q`$ in the frame of end-effector pose at $`t=0`$. Randomizing the initial pose of the end-effector ($`s_0`$),@luoSERLSoftwareSuite2025 achieved a similar result to that of having to manually randomize the environment at every timestep, but with the benefit of maintaining the environment in the same condition across multiple training episodes, achieving higher scalability of their method thanks to the increased practicality of their approach.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch3/ch3-hil-serl-examples.png" style="width:80.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch3/ch3-hil-serl-examples.png" style="width:80.0%" />
 <p>&lt;span id="hil-serl-blocks" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>(A) HIL-SERL allows for real-world training of high performance RL agents by building on top advancements presented by of SAC, RLPD and SERL. (B) Example of human intervention during a HIL-SERL training process on a SO-100.</figcaption>
 </figure>
@@ -564,7 +585,7 @@ TL;DR Behavioral Cloning provides a natural platform to learn from real-world in
 </div>
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-bc-trajectories.png" style="width:80.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-bc-trajectories.png" style="width:80.0%" />
 <p>&lt;span id="ch4-bc-trajectories" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>(A) Average (with standard deviation) evolution of the actuation levels over the first 5 recorded episodes in <a href="lerobot/svla_so101_pickplace" class="uri">lerobot/svla_so101_pickplace</a>. Proprioperceptive state provide invaluable to determine the robot’s state during an episode. (B) Camera frames are also recorded alongside measurements on the robot’s state, capturing information about the robot’s interaction with its environment.</figcaption>
 </figure>
@@ -574,7 +595,7 @@ Learning from human demonstrations provides a pragmatic alternative to the reinf
 Formally, let $`\mathcal D = \{ \tau^{(i)} \}_{i=1}^N`$ be a set of expert trajectories, with $`\tau^{(i)} = \{(o_t^{(i)}, a_t^{(i)})\}_{t=0}^{T_i}`$ representing the $`i`$-th trajectory in $`\mathcal D`$, $`o_t \in \mathcal O`$ denoting observations (e.g., images and proprioception altogether), and $`a_t \in \mathcal A`$ the expert actions. Typically, observations $`o \in \mathcal O`$ consist of both image and proprioperceptive information, while actions $`a \in \mathcal A`$ represent control specifications for the robot to execute, e.g. a joint configuration. Note that differently from Section <a href="#learning-rl" data-reference-type="ref" data-reference="learning-rl">[learning-rl]</a>, in the imitation learning context $`\mathcal D`$ denotes an offline dataset collecting $`N`$ length-$`T_i`$ reward-free (expert) human trajectories $`\tau^{(i)}`$, and *not* the environment dynamics. Similarily, in this section $`\tau^{(i)}`$ represent a length-$`T_i`$ trajectory of observation-action pairs, which crucially *omits entirely any reward* information. Figure <a href="#ch4-bc-trajectories" data-reference-type="ref" data-reference="ch4-bc-trajectories">[ch4-bc-trajectories]</a> graphically shows trajectories in terms of the average evolution of the actuation on the 6 joints over a group of teleoperated episodes for the SO-100 manipulator. Notice how proprioperceptive states are captured jointly with camera frames over the course of the recorded episodes, providing a unified high-frame rate collection of teleoperation data. Figure <a href="#ch4-observation-action-mapping" data-reference-type="ref" data-reference="ch4-observation-action-mapping">[ch4-observation-action-mapping]</a> shows $`(o_t, a_t)`$-pairs for the same dataset, with the actions performed by the human expert illustrated just alongside the corresponding observation. In principle, (expert) trajectories $`\tau^{(i)}`$ can have different lengths since demonstrations might exhibit multi-modal strategies to attain the same goal, resulting in possibly multiple, different behaviors.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-observation-action-mapping.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-observation-action-mapping.png" style="width:90.0%" />
 <p>&lt;span id="ch4-observation-action-mapping" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Sample observations and action pairs over the course of a given trajectory recorded in <a href="lerobot/svla_so101_pickplace" class="uri">lerobot/svla_so101_pickplace</a>. Observations, comprising of both proprioperceptive and visual information, are recorded alongside the configuration of a second, leader robot controlled by a human expert, providing complete information for regressing actions given observation.</figcaption>
 </figure>
@@ -590,7 +611,7 @@ Typically, the expert’s joint observation-action distribution $`p: \mathcal O\
 Despite the inherent challenges of learning on non-i.i.d. data, the BC formulation affords several operational advantages in robotics. First, training happens offline and typically uses expert human demonstration data, hereby severily limiting exploration risks by preventing the robot from performing dangerous actions altogether. Second, reward design is entirely unnecessary in BC, as demonstrations already reflect human intent and task completion. This also mitigates the risk of misalignment and specification gaming (*reward hacking*), otherwise inherent in purely reward-based RL @heessEmergenceLocomotionBehaviours2017. Third, because expert trajectories encode terminal conditions, success detection and resets are implicit in the dataset. Finally, BC scales naturally with growing corpora of demonstrations collected across tasks, embodiments, and environments. However, BC can in principle only learn behaviors that are, at most, as good as the one exhibited by the demonstrator, and thus critically provides no mitigation for the suboptimal decision making that might be enaced by humans. Still, while problematic in sequential-decision making problems for which expert demonstrations are not generally available--data migth be expensive to collect, or human performance may be inherently suboptimal--many robotics applications benefit from relative cheap pipelines to acquire high-quality trajectories generated by humans, thus justifying BC approaches.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-issues-with-bc.png" style="width:80.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-issues-with-bc.png" style="width:80.0%" />
 <p>&lt;span id="ch4-issues-with-bc" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Point-wise policies suffer from limitations due to (A) covariate shifts and poor approximation of (B) multimodal demonstrations. (A) Initially small errors may drive the policy out of distribution, incuring in a vicious circle ultimately resulting in failure. (B) Both modes of reaching for a target object in a scene, either left or right-first, are equally as good and thus equally as likely to be present in a dataset of human demonstrations, ultimately resulting in multimodal demonstrations.</figcaption>
 </figure>
@@ -604,7 +625,7 @@ Generative Models (GMs) aim to learn the stochastic process underlying the very
 #### Variational Auto-Encoders
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-task-effect-on-pairs.png" style="width-80.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-task-effect-on-pairs.png" style="width-80.0%" />
 <p>&lt;span id="ch4-task-effect-on-pairs" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Intuitively, latent variable in a single latent model may contain information regarding the task being performed, which directly results in the likelihood of the same observation-action pair being different for two different tasks. When (A) picking a block the likelihood of a wide gripper’s opening should be higher than narrower one, while it should be the opposite when (B) pushing the block.</figcaption>
 </figure>
@@ -616,49 +637,60 @@ A common inductive bias used in GM posits samples $`(o,a)`$ are influenced from
 Intuitively, in the case of observation-action pairs $`(o, a)`$ for a robotics application, $`z`$ could be some high level representation of the underlying task being performed by the human demonstrator. In such case, treating $`p(o,a)`$ as a marginalization over $`\text{supp}({Z})`$ of the complete joint distribution $`p(o,a,z)`$ natively captures the effect different tasks have on the likelihood of observation-action pairs. Figure <a href="#ch4-task-effect-on-pairs" data-reference-type="ref" data-reference="ch4-task-effect-on-pairs">[ch4-task-effect-on-pairs]</a> graphically illustrates this concept in the case of a (A) picking and (B) pushing task, for which, nearing the target object, the likelihood of actions resulting in opening the gripper--the higher $`q_6`$, the wider the gripper’s opening--should intuitively be (A) high or (B) low, depending on the task performed. While the latent space $`Z`$ typically has a much richer structure than the set of all actual tasks performed, <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a> still provides a solid framework to learn joint distribution conditioned on unobservable yet relevant factors. Figure <a href="#ch4-latent-variable-model" data-reference-type="ref" data-reference="ch4-latent-variable-model">[ch4-latent-variable-model]</a> represents this framework of latent-variable for a robotics application- the true, $`z`$-conditioned generative process on assigns *likelihood* $`p((o,a) \vert z)`$ to the single $`(o,a)`$-pair. Using Bayes’ theorem, one can reconstruct the *posterior* distribution on $`\text{supp}({Z})`$, $`q_\theta(z \vert o,a)`$ from the likelihood $`p_\theta(o,a \vert z)`$, *prior* $`p_\theta(z)`$ and *evidence* $`p_\theta(o,a)`$. VAEs approximate the latent variable model presented in <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a>) using an *approximate posterior* $`q_\phi(z \vert o,a)`$ while regressing parameters for a parametric likelihood, $`p_\theta(o,a \vert z)`$ (Figure <a href="#ch4-latent-variable-model" data-reference-type="ref" data-reference="ch4-latent-variable-model">[ch4-latent-variable-model]</a>).
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-latent-variable-model.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-latent-variable-model.png" style="width:90.0%" />
 <p>&lt;span id="ch4-latent-variable-model" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>(A) The latent variable model in a robotics application regulates influence between observed (<span class="math inline"><em>o</em>, <em>a</em>)</span> variables and an unobservable latent variable. (B) VAEs approximate exact latent variable models by means of variational inference. </figcaption>
 </figure>
 
-Given a dataset $`\mathcal D`$ consisting of $`N`$ i.i.d. observation-action pairs, the log-likelihood of all datapoints under $`\theta`$ (in Bayesian terms, the *evidence* $`p_\theta(\mathcal D)`$) can thus be written as: 
-$$
-`\htmlId{evidence-definition-1}{\log p_\theta(\mathcal D) = \log \sum_{i=0}^N p_\theta ((o,a)_i)\\
-    = \log \sum_{i=0}^N \int_{\text{supp}({Z})} p_\theta((o,a)_i \vert z) p(z)\\
-    = \log \sum_{i=0}^N \int_{\text{supp}({Z})} \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z) p(z)\\
-    = \log \sum_{i=0}^N \mathbb E_{z \sim p_\theta(\bullet \vert (o,a)_i)} [\frac{p(z)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z)],}`
-$$
- where we used <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a> in <a href="#evidence-definition-1" data-reference-type="ref" data-reference="evidence-definition-1">[evidence-definition-1]</a>, multiplied by $`1 = \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)}`$ in <a href="#evidence-definition-2" data-reference-type="ref" data-reference="evidence-definition-2">[evidence-definition-2]</a>, and used the definition of expected value in <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a>.
+Given a dataset $`\mathcal D`$ consisting of $`N`$ i.i.d. observation-action pairs, the log-likelihood of all datapoints under $`\theta`$ (in Bayesian terms, the *evidence* $`p_\theta(\mathcal D)`$) can thus be written as:
+``` math
+\begin{align}
+    \log p_\theta(\mathcal D) &= \log \sum_{i=0}^N p_\theta ((o,a)_i) \\
+                              &= \log \sum_{i=0}^N \int_{\text{supp}({Z})} p_\theta((o,a)_i \vert z) p(z) \\
+                              &= \log \sum_{i=0}^N \int_{\text{supp}({Z})} \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z) p(z) \\
+                              &= \log \sum_{i=0}^N \mathbb E_{z \sim p_\theta(\bullet \vert (o,a)_i)} [\frac{p(z)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z)], 
+\end{align}
+```
+where we used <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a> in <a href="#evidence-definition-1" data-reference-type="ref" data-reference="evidence-definition-1">[evidence-definition-1]</a>, multiplied by $`1 = \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)}`$ in <a href="#evidence-definition-2" data-reference-type="ref" data-reference="evidence-definition-2">[evidence-definition-2]</a>, and used the definition of expected value in <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a>.
 
 In the special case where one assumes distributions to be tractable, $`p_\theta (\mathcal D)`$ is typically tractable too, and $`\max_\theta \log p_\theta(\mathcal D)`$ provides a natural target for (point-wise) infering the unknown parameters $`\theta`$ of the generative model. Unfortunately, <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> is rarely tractable when the distribution $`p`$ is modeled with approximators such as neural networks, especially for high-dimensional, unstructured data.
 
 In their seminal work on Variational Auto-Encoders (VAEs), @kingmaAutoEncodingVariationalBayes2022 present two major contributions to learn complex latent-variable GMs on unstructured data, proposing (1) a tractable, variational lower-bound to <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> as an optimization target to jointly learn likelihood and posterior and (2) high-capacity function approximators to model the likelihood $`p_\theta(o,a\vert z)`$ and (approximate) posterior distribution $`q_\phi(z \vert o,a) \approx q_\theta(z \vert o,a)`$.
 
-In particular, the lower bound on <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> (Evidence LOwer Bound, *ELBO*) can be derived from <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> applying Jensen’s inequality--$`\log \mathbb{E}[\bullet] \geq \mathbb{E} [\log (\bullet)]`$--yielding: 
-$$
-`\htmlId{ELBO-intractable}{\log p_\theta(\mathcal D) \geq \sum_{i=0}^{N} \left(
+In particular, the lower bound on <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> (Evidence LOwer Bound, *ELBO*) can be derived from <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> applying Jensen’s inequality--$`\log \mathbb{E}[\bullet] \geq \mathbb{E} [\log (\bullet)]`$--yielding:
+``` math
+\begin{align}
+    \log p_\theta(\mathcal D) &\geq \sum_{i=0}^{N} \left(
             \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big]
             + \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} [\log \left( \frac{p(z)}{q_\theta(z \vert (o,a)_i)} \right)]
-        \right)\\
-    = \sum_{i=0}^{N} \left(
+        \right) \\
+        &= \sum_{i=0}^{N} \left(
             \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big]
         - \text{D}_{\text{KL}}\big[ q_\theta(z \vert (o,a)_i) \Vert p(z) \big]
-        \right)}`
-$$
- The true, generally intractable posterior $`p_\theta (z \vert o,a)`$ prevents computing both the expectation and KL divergence terms in <a href="#ELBO-intractable" data-reference-type="ref" data-reference="ELBO-intractable">[ELBO-intractable]</a>, and therefore @kingmaAutoEncodingVariationalBayes2022 propose deriving the ELBO using an *approximate* posterior $`q_\phi(z \vert o,a)`$, resulting in the final, tractable ELBO objective, $`\htmlId{ELBO}{\text{ELBO}_{\mathcal D}(\theta, \phi) = \sum_{i=0}^{N} \left(
+        \right) 
+\end{align}
+```
+The true, generally intractable posterior $`p_\theta (z \vert o,a)`$ prevents computing both the expectation and KL divergence terms in <a href="#ELBO-intractable" data-reference-type="ref" data-reference="ELBO-intractable">[ELBO-intractable]</a>, and therefore @kingmaAutoEncodingVariationalBayes2022 propose deriving the ELBO using an *approximate* posterior $`q_\phi(z \vert o,a)`$, resulting in the final, tractable ELBO objective,
+``` math
+\begin{align}
+\text{ELBO}_{\mathcal D}(\theta, \phi) = \sum_{i=0}^{N} \left(
             \mathbb{E}_{z \sim q_\phi(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big]
         - \text{D}_{\text{KL}}\big[ q_\phi(z \vert (o,a)_i) \Vert p(z) \big]
-        \right)}`$ From Jensen’s inequality, maximizing ELBO results in maximizing the log-likelihood of the data too, thus providing a natural, tractable optimization target. Indeed, expectations can be estimated using MC estimates from the learned distributions in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, while the KL-divergence term can typically be computed in closed-form (1) modeling $`q_\phi`$ as a Gaussian $`q_\phi(z \vert o,a) = \mathcal N\big(\mu_\phi(o,a), \Sigma_\phi(o,a) \big)`$ and (2) imposing a standard Gaussian prior on the latent space, $`p(z) = \mathcal N(\mathbf{0}, \mathbf{I})`$.
+        \right)
+        
+\end{align}
+```
+From Jensen’s inequality, maximizing ELBO results in maximizing the log-likelihood of the data too, thus providing a natural, tractable optimization target. Indeed, expectations can be estimated using MC estimates from the learned distributions in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, while the KL-divergence term can typically be computed in closed-form (1) modeling $`q_\phi`$ as a Gaussian $`q_\phi(z \vert o,a) = \mathcal N\big(\mu_\phi(o,a), \Sigma_\phi(o,a) \big)`$ and (2) imposing a standard Gaussian prior on the latent space, $`p(z) = \mathcal N(\mathbf{0}, \mathbf{I})`$.
 
 An intuitive explanation of the learning dynamics of VAEs can be given considering the equivalent case of *minimizing the negative ELBO*, which admits a particularly interpretable factorization
 
-
-$$
-`\htmlId{VAE-min-neg-ELBO}{\min_{\theta, \phi} - \text{ELBO}_{\mathcal (o,a) \sim \mathcal D}(\theta, \phi) = \min_{\theta, \phi}\mathbf{L^{\text{rec}}}(\theta) + \mathbf{L^{\text{reg}}}(\phi)\\
-    \mathbf{L^{\text{rec}}}(\theta) = \mathbb{E}_{z \sim q_\phi(\cdot \vert o,a} \big[ \log p_\theta(o,a \vert z) \big]\\
-    \mathbf{L^{\text{reg}}}(\phi) = \text{D}_{\text{KL}}\big[ q_\phi(z \vert o,a) \Vert p(z) \big]}`
-$$
-
+``` math
+\begin{align}
+\min_{\theta, \phi} - \text{ELBO}_{\mathcal (o,a) \sim \mathcal D}(\theta, \phi) &= \min_{\theta, \phi}\mathbf{L^{\text{rec}}}(\theta) + \mathbf{L^{\text{reg}}}(\phi) \\
+\mathbf{L^{\text{rec}}}(\theta) &= \mathbb{E}_{z \sim q_\phi(\cdot \vert o,a} \big[ \log p_\theta(o,a \vert z) \big]  \\
+\mathbf{L^{\text{reg}}}(\phi) &= \text{D}_{\text{KL}}\big[ q_\phi(z \vert o,a) \Vert p(z) \big] 
+\end{align}
+```
 
 For any given $`(o,a)`$ pair, the expected value term of <a href="#VAE-Lrec" data-reference-type="ref" data-reference="VAE-Lrec">[VAE-Lrec]</a> is typically computed via MC estimates, resulting in
 ``` math
@@ -672,15 +704,17 @@ Indeed, it is very common in practice to approximate from the learned likelihood
 
 #### Diffusion Models
 
-VAEs approximate probability distributions via a *single* latent variable model, assuming the underlying unknown distribution can be factored according to <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a>, and solve the variational inference problem of jointly learning the likelihood $`p_\theta`$ and (approximate) posterior $`q_\phi`$ for such model. In that, the unknown data distribution $`p(o,a)`$ is effectively approximated via $`\int_Z p(z) p_\theta(o,a \vert z)`$, and the underlying generative process reproduced by (1) sampling a latent variable and (2) learning to decode it into a (ideally) high-likelihood sample under the (unknown) $`p(o,a)`$. Diffusion Models (DMs) @hoDenoisingDiffusionProbabilistic2020 are another class of GMs which treat the similar problem of approximating an underlying unknown data distribution--*variational inference*--by *partially* extending VAEs to the case where *multiple* latent variables influence each other and the generative process underlying $`o,a`$ itself. In particular, DMs posit the generative process can be decomposed to a series of piece-wise (Markovian) interactions between (latent) variables (Figure <a href="#ch4-many-latents" data-reference-type="ref" data-reference="ch4-many-latents">[ch4-many-latents]</a>), resulting in 
-$$
-`\htmlId{BC-multi-latent-model-1}{p(\underbrace{o,a}_{= z_0}) = \int_{\text{supp}({Z_0})} \int_{\text{supp}({Z_1})} \ldots \int_{\text{supp}({Z_T})} p(z_0, z_1, \dots z_T)\\
-    p(z_0, z_1, \dots z_T) = p(z_T) \prod_{t=0}^{T} p(z_{t-1} \vert z_t),}`
-$$
- where we explicitly showed the marginalization over the multiple latents in <a href="#BC-multi-latent-model-1" data-reference-type="ref" data-reference="BC-multi-latent-model-1">[BC-multi-latent-model-1]</a>, and used the law of conditional probability and Markov property in <a href="#BC-multi-latent-model-2" data-reference-type="ref" data-reference="BC-multi-latent-model-2">[BC-multi-latent-model-2]</a>.
+VAEs approximate probability distributions via a *single* latent variable model, assuming the underlying unknown distribution can be factored according to <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a>, and solve the variational inference problem of jointly learning the likelihood $`p_\theta`$ and (approximate) posterior $`q_\phi`$ for such model. In that, the unknown data distribution $`p(o,a)`$ is effectively approximated via $`\int_Z p(z) p_\theta(o,a \vert z)`$, and the underlying generative process reproduced by (1) sampling a latent variable and (2) learning to decode it into a (ideally) high-likelihood sample under the (unknown) $`p(o,a)`$. Diffusion Models (DMs) @hoDenoisingDiffusionProbabilistic2020 are another class of GMs which treat the similar problem of approximating an underlying unknown data distribution--*variational inference*--by *partially* extending VAEs to the case where *multiple* latent variables influence each other and the generative process underlying $`o,a`$ itself. In particular, DMs posit the generative process can be decomposed to a series of piece-wise (Markovian) interactions between (latent) variables (Figure <a href="#ch4-many-latents" data-reference-type="ref" data-reference="ch4-many-latents">[ch4-many-latents]</a>), resulting in
+``` math
+\begin{align}
+    p(\underbrace{o,a}_{= z_0}) &= \int_{\text{supp}({Z_0})} \int_{\text{supp}({Z_1})} \ldots \int_{\text{supp}({Z_T})} p(z_0, z_1, \dots z_T)  \\ 
+    p(z_0, z_1, \dots z_T) &= p(z_T) \prod_{t=0}^{T} p(z_{t-1} \vert z_t), 
+\end{align}
+```
+where we explicitly showed the marginalization over the multiple latents in <a href="#BC-multi-latent-model-1" data-reference-type="ref" data-reference="BC-multi-latent-model-1">[BC-multi-latent-model-1]</a>, and used the law of conditional probability and Markov property in <a href="#BC-multi-latent-model-2" data-reference-type="ref" data-reference="BC-multi-latent-model-2">[BC-multi-latent-model-2]</a>.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-many-latents.png" style="width-50.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-many-latents.png" style="width-50.0%" />
 <p>&lt;span id="ch4-many-latents" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>HMLV models posit the data generation process is influenced by a stack of Markov-dependent latent variables, with samples from the posterior distribution being progressively higher up in the hierarchy.</figcaption>
 </figure>
@@ -689,19 +723,21 @@ Similarily to VAEs, providing an exact interpretation for the latent variables i
 
 Just like VAEs, DMs attemp to learn to reproduce an underlying data distribution $`p (o,a)`$ given a collection of i.i.d. samples approximating the model posited to have generated the data in the first place ( <a href="#BC-multi-latent-model-1" data-reference-type="ref" data-reference="BC-multi-latent-model-1">[BC-multi-latent-model-1]</a>). Similarily to VAEs, DMs approximate the process of sampling from the unknown $`p(o,a)`$ (1) sampling from an easy-to-sample distribution (e.g., Gaussian) and (2) learning to reconstruct high-likelihood samples under the unknown distribution. However, in stark contrast with VAEs, the easy-to-sample distribution contains *no mutual information* regarding the data distribution $`p(o,a)`$. Crucially, as no information from the sample $`(o,a)`$ (denoted as $`z_0 \equiv (o,a)`$ for the sake of notation) is assumed to be propagated throughout the chain of latents, the posterior $`q(z_t \vert z_{t-1})`$ assumes a relatively amicable structure in DMs, reducing complexity. The *true* likelihood $`p(z_{t-1} \vert z_t)`$ is instead typically approximated using the parametrization $`p_\theta (z_{t-1} \vert z_t)`$. In that, the information contained in the unknwon data distribution is *reconstructed* via a process in which samples from a fixed distribution are turned into (ideally) high-likelihood samples under $`p(o,a)`$--a process referred to as *denoising*.
 
-Under such model, we can express the log-likelihood of an arbitrary sample as[^4] 
-$$
-`\htmlId{diffusion-likelihood}{\log p_\theta (\underbrace{o,a}_{= z_0}) = 
-    \mathbb{E}_{z_1 \sim q(\bullet \vert z_0)} \log p_\theta (z_0 \vert z_1) -\\
-    \mathbb{E}_{z_{T-1} \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_T \vert z_{T-1}) \Vert p(z_T) ) \big] - \notag\\
-    \sum_{t=1}^{T-1} \mathbb{E}_{(z_{t-1}, z_{t+1}) \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_t \vert z_{t-1}) \Vert p_\theta(z_t \vert z_{t-1}) ) \big], \notag}`
-$$
- providing an optimization target in the form of $`\max_\theta \log p_\theta (\mathcal D)`$.
+Under such model, we can express the log-likelihood of an arbitrary sample as[^4]
+``` math
+\begin{align}
+    \log p_\theta (\underbrace{o,a}_{= z_0}) = 
+    &\mathbb{E}_{z_1 \sim q(\bullet \vert z_0)} \log p_\theta (z_0 \vert z_1) -  \\
+    &\mathbb{E}_{z_{T-1} \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_T \vert z_{T-1}) \Vert p(z_T) ) \big] - \notag \\ 
+    &\sum_{t=1}^{T-1} \mathbb{E}_{(z_{t-1}, z_{t+1}) \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_t \vert z_{t-1}) \Vert p_\theta(z_t \vert z_{t-1}) ) \big], \notag
+\end{align}
+```
+providing an optimization target in the form of $`\max_\theta \log p_\theta (\mathcal D)`$.
 
 In their seminal work on using DMs for variational inference, @hoDenoisingDiffusionProbabilistic2020 introduce major contributions regarding solving $`\min_\theta -\log p_\theta(o,a)`$. In particular, @hoDenoisingDiffusionProbabilistic2020 exclusively adopt a fixed *Gaussian* posterior in the form of $`q(z_t \vert z_{t-1}) = \mathcal{N}(\sqrt{1-\beta_t}z_{t-1}, \beta_t \mathbf I)`$. The choice of adopting Gaussians has profound implications on the generative process modeled. Indeed, under the (mild) assumption that the variance is sufficiently small $`\beta_t \leq \eta, \eta \in \mathbb R^+`$, @sohl-dicksteinDeepUnsupervisedLearning2015 proved that the likelihood $`p(z_{t-1} \vert z_t)`$ is Gaussian as well, which allows for the particularly convenient parametrization of the approximate likelihood $`p_\theta (x_{t-1} \vert x_t) = \mathcal N(\mu_\theta(x_t, t), \Sigma_\theta(x_t,t)), \ t \in [1,T]`$, as well as for closed-form tractability of the KL-divergence terms in <a href="#diffusion-likelihood" data-reference-type="ref" data-reference="diffusion-likelihood">[diffusion-likelihood]</a>. Further, the posterior’s structure also enables an analytical description for the distribution of the $`t`$-th latent variable, $`q(z_t \vert z_0) = \mathcal N (\sqrt{\bar{\alpha}_t}z_0, (1-\bar{\alpha}_t) \mathbf{I})`$, with $`\alpha_t = 1-\beta_t, \ \bar \alpha_t = \prod_{k=1}^t \alpha_k`$, which conveniently prevents iterative posterior sampling.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-diffusion-robot-actions.png" style="width-90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-diffusion-robot-actions.png" style="width-90.0%" />
 <p>&lt;span id="diffusion-robot-actions" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>DMs iteratively corrupt samples (left) from an unknown distribution into a quasi-standard Gaussian (center), learning the displacement field (right) that permits to reconstruct samples from the unknown target distribution by iteratively denoising samples of a tractable, easy-to-sample distribution.</figcaption>
 </figure>
@@ -709,30 +745,43 @@ In their seminal work on using DMs for variational inference, @hoDenoisingDiffu
 Finally, adopting Gaussian posteriors permits a particularly pleasing interpretation of the dynamics of training DMs @permenterInterpretingImprovingDiffusion2024. By using Gaussian posteriors, the hierarchical latent variables effectively lose increasingly more information circa the original (unknown) distribution’s sample, $`z_0`$, increasingly distributing according to a standard Gaussian and thus containing no information at all (Figure <a href="#diffusion-robot-actions" data-reference-type="ref" data-reference="diffusion-robot-actions">[diffusion-robot-actions]</a>). Figure <a href="#diffusion-robot-actions" data-reference-type="ref" data-reference="diffusion-robot-actions">[diffusion-robot-actions]</a> illustrates this procedure on a simplified, bidimensional observation-action distribution, where we considered $`o=q_2`$ and $`a=q^h_2`$, with $`q_2`$ representing the robot’s *elbow flex* actuation and $`q^h_2`$ the human teleoperator’s robot elbow flex.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-action-vs-observation-distribution.png" style="width-30.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-action-vs-observation-distribution.png" style="width-30.0%" />
 <p>&lt;span id="ch4-action-vs-observation-distribution" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>A joint action-observation distribution, in the simplified case where the observation is the elbow-flex actuation in a SO-100, and the action is the recorded position for the same joint in the teleoperator arm. The motion recorded being teleoperated, the points distribute along a the diagonal.</figcaption>
 </figure>
 
-Because the recorded behavior is teleoperated, measurements mostly distribute along the line $`a = o + \eta, \eta \sim N(0,1)`$, with $`\eta`$-variability accouting for minor control inconsistencies (Figure <a href="#ch4-action-vs-observation-distribution" data-reference-type="ref" data-reference="ch4-action-vs-observation-distribution">[ch4-action-vs-observation-distribution]</a>). Using Gaussian posteriors--i.e., adding Gaussian noise--effectively simulates a *Brownian motion* for the elements in the distribution’s support (in Figure <a href="#diffusion-robot-actions" data-reference-type="ref" data-reference="diffusion-robot-actions">[diffusion-robot-actions]</a>, $`\mathcal O\times \mathcal A`$), whereby information *diffuses away* from the samples, and comparing the diffused samples to the original data points one can derive an estimate of the total displacement induced by diffusion. Under the only assumption that the likelihood of the diffused samples is low under the original unknown data distribution, then one can effectively approximate the unkwown distribution by learning to *reverse* such displacement. This key intuition allows to write a simplified training objective: $`\htmlId{diffusion-simplified-loss}{\mathcal L(\theta) = \mathbb{E}_{t, z_0, \epsilon} \big[
+Because the recorded behavior is teleoperated, measurements mostly distribute along the line $`a = o + \eta, \eta \sim N(0,1)`$, with $`\eta`$-variability accouting for minor control inconsistencies (Figure <a href="#ch4-action-vs-observation-distribution" data-reference-type="ref" data-reference="ch4-action-vs-observation-distribution">[ch4-action-vs-observation-distribution]</a>). Using Gaussian posteriors--i.e., adding Gaussian noise--effectively simulates a *Brownian motion* for the elements in the distribution’s support (in Figure <a href="#diffusion-robot-actions" data-reference-type="ref" data-reference="diffusion-robot-actions">[diffusion-robot-actions]</a>, $`\mathcal O\times \mathcal A`$), whereby information *diffuses away* from the samples, and comparing the diffused samples to the original data points one can derive an estimate of the total displacement induced by diffusion. Under the only assumption that the likelihood of the diffused samples is low under the original unknown data distribution, then one can effectively approximate the unkwown distribution by learning to *reverse* such displacement. This key intuition allows to write a simplified training objective:
+``` math
+\begin{align}
+
+    \mathcal L(\theta) = \mathbb{E}_{t, z_0, \epsilon} \big[
         \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} z_0 + \epsilon \sqrt{1 - \bar \alpha_t}, t) \Vert^2 \big], \quad t \sim \mathcal{U}(\{1,\dots,T\}), \quad
         z_0 \sim \mathcal{D}, \quad
-        \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}).}`$
+        \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}).
+\end{align}
+```
 
 In this simplified (minimization) objective, the optimization process differs from <a href="#diffusion-likelihood" data-reference-type="ref" data-reference="diffusion-likelihood">[diffusion-likelihood]</a> in that, rather than maxizing $`p_\theta`$ directly, the parameters $`\theta`$ of the pairwise likelihood $`p_\theta(z_{t-1} \vert z_t)`$ are adjusted to *predict the total displacement* $`\epsilon`$ for a randomly long ($`t \sim \mathcal{U}(\{1,\dots,T\}`$ )) diffusion process starting from a sample of the target distribution.
 
-By learning the total displacement from a generally, uninformative corrupted sample obtained diffusing information and a sample from an unknown distribution--significant ($`\Vert \epsilon \Vert > 0`$) whenever input and target distribution are sufficiently different-- @hoDenoisingDiffusionProbabilistic2020 show that one can approximate the underlying distribution reversing the displacement, *denoising* samples. Interestingly, under the hypothesis real-world data belongs to a single higher dimensional manifold (Manifold Hypothesis), @permenterInterpretingImprovingDiffusion2024 show that diffusion learns the gradient of a distance function from any off-point manifold (such as perturbed, uniformative samples), and the data manifold itself. Following this gradient--i.e., denoising a sample from an uninformative distribution--corresponds to projecting back into the manifold, yielding a procedure to sample from unknown distributions by means of Euclidean projection. Indeed, under the assumption that $`p_\theta (z_{t-1} \vert z_t)`$ is Gaussian, then sampling $`z_{t-1} \sim p_\theta(\bullet \vert z_{t})`$ corresponds to computing $`\htmlId{diffusion-denoising-definition}{z_{t-1} = \frac{1}{\sqrt{\alpha_t}} \left( z_t - \frac{\beta_t}{\sqrt{1 - \bar\alpha_t}} \epsilon_\theta(z_t, t) \right) + \sigma_t \epsilon, \quad \epsilon \sim \mathcal N(\mathbf{0}, \mathbf{I}),}`$ thus showing that the lower-level latent variables in a DM can be obtained by iteratively removing noise from the one-step higher order variable, using the noise regressor $`\epsilon_\theta(z_t, t)`$ learned minimizing <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>.
+By learning the total displacement from a generally, uninformative corrupted sample obtained diffusing information and a sample from an unknown distribution--significant ($`\Vert \epsilon \Vert > 0`$) whenever input and target distribution are sufficiently different-- @hoDenoisingDiffusionProbabilistic2020 show that one can approximate the underlying distribution reversing the displacement, *denoising* samples. Interestingly, under the hypothesis real-world data belongs to a single higher dimensional manifold (Manifold Hypothesis), @permenterInterpretingImprovingDiffusion2024 show that diffusion learns the gradient of a distance function from any off-point manifold (such as perturbed, uniformative samples), and the data manifold itself. Following this gradient--i.e., denoising a sample from an uninformative distribution--corresponds to projecting back into the manifold, yielding a procedure to sample from unknown distributions by means of Euclidean projection. Indeed, under the assumption that $`p_\theta (z_{t-1} \vert z_t)`$ is Gaussian, then sampling $`z_{t-1} \sim p_\theta(\bullet \vert z_{t})`$ corresponds to computing
+``` math
+\begin{align}
+    z_{t-1} = \frac{1}{\sqrt{\alpha_t}} \left( z_t - \frac{\beta_t}{\sqrt{1 - \bar\alpha_t}} \epsilon_\theta(z_t, t) \right) + \sigma_t \epsilon, \quad \epsilon \sim \mathcal N(\mathbf{0}, \mathbf{I}), 
+\end{align}
+```
+thus showing that the lower-level latent variables in a DM can be obtained by iteratively removing noise from the one-step higher order variable, using the noise regressor $`\epsilon_\theta(z_t, t)`$ learned minimizing <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>.
 
 #### Flow Matching
 
 \<span id="ch4-flow-matching" style="position: absolute;"\>\</span\>
 
-The posterior parametrization adopted by DMs proved traditionally effective, yet it raised concerns circa its efficiency at inference time, where a possibly large of compute-expensive denoising steps are needed in order to recover a sample from the target distribution. Flow Matching (FM) @lipmanFlowMatchingGenerative2023 extends DMs to the general case of arbitrary, parametrized likelihood and posteriors, and in this defines a superseding class of GMs providing a unified framework for learning *continuous transformations* between distributions, encompassing and generalizing DMs. Instead of a *stochastic, discrete, multi-step* denoising process, FM aims to learn a *deterministic, continuous, differentiable flow* $`\psi [0,1] \times Z \mapsto Z`$, formalized starting from possibly time-dependent vector field $`v: [0,1] \times Z \mapsto Z`$ transporting samples from a simple prior distribution $`p_0`$--e.g., a standard Gaussian--to a more complex, potentially unknown data distribution $`p_1`$ over time. Note how FM models time $`t \in [0,1]`$ to be varying continuously while moving away *from* an easy-to-sample distribution $`p_0`$ *towards* the unknown data-distribution, $`p_1`$. This results in a continuous and deterministic trajectory for each sample, which can be more efficient to generate compared to the stochastic paths of DMs. Formally, FM can be fully characterized by an ordinary differential equation (ODE) relating instantaneous variations of flows with the underlying vector field, and hence providing complete trajectories over the distributions’ support when integrating over time, 
-$$
-`\frac{d}{dt} \psi(z, t) = v(t, \psi(t, z))\\
-    \psi(0, z) = z`
-$$
-
+The posterior parametrization adopted by DMs proved traditionally effective, yet it raised concerns circa its efficiency at inference time, where a possibly large of compute-expensive denoising steps are needed in order to recover a sample from the target distribution. Flow Matching (FM) @lipmanFlowMatchingGenerative2023 extends DMs to the general case of arbitrary, parametrized likelihood and posteriors, and in this defines a superseding class of GMs providing a unified framework for learning *continuous transformations* between distributions, encompassing and generalizing DMs. Instead of a *stochastic, discrete, multi-step* denoising process, FM aims to learn a *deterministic, continuous, differentiable flow* $`\psi [0,1] \times Z \mapsto Z`$, formalized starting from possibly time-dependent vector field $`v: [0,1] \times Z \mapsto Z`$ transporting samples from a simple prior distribution $`p_0`$--e.g., a standard Gaussian--to a more complex, potentially unknown data distribution $`p_1`$ over time. Note how FM models time $`t \in [0,1]`$ to be varying continuously while moving away *from* an easy-to-sample distribution $`p_0`$ *towards* the unknown data-distribution, $`p_1`$. This results in a continuous and deterministic trajectory for each sample, which can be more efficient to generate compared to the stochastic paths of DMs. Formally, FM can be fully characterized by an ordinary differential equation (ODE) relating instantaneous variations of flows with the underlying vector field, and hence providing complete trajectories over the distributions’ support when integrating over time,
+``` math
+\begin{align}
+    \frac{d}{dt} \psi(z, t) &= v(t, \psi(t, z)) \\
+    \psi(0, z) &= z
+\end{align}
+```
 
 FM proved very effective in a variety of applications, ranging from image @esserScalingRectifiedFlow2024 and video generation @polyakMovieGenCast2025 to robotics control @blackp0VisionLanguageActionFlow2024. Most notably, in their introductory work on FM for GM, @lipmanFlowMatchingGenerative2023 show how DMs can be seen as a specific instance of FM where the *conditional* target vector field $`u`$ approximated by the noise regressor corresponds to
 ``` math
@@ -741,7 +790,7 @@ FM proved very effective in a variety of applications, ranging from image @esse
 Note that the traditional discrete-time noise-scheduler $`{\beta_t}_{t=0}^T`$ is now generalized to a continuous map $`\beta : [0,1] \mapsto \mathbb R^+`$. Crucially, @lipmanFlowMatchingGenerative2023 prove that by exclusively optimizing the vector field for individual data points $`z_0 \in \mathcal D`$ individually, one also retrieves the optimal flow to morph the entire support of the initial distribution $`p_0`$ into $`p_1 \ \text{s.t.} \mathcal D \sim p_1`$.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-normalizing-flows.png" style="width:80.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-normalizing-flows.png" style="width:80.0%" />
 <p>&lt;span id="ch4-normalizing-flows" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Probability distributions can be modified applying vector fields resulting in a flow of mass in the support. When acting over time, vector fields can effectively change the distribution’s structure.</figcaption>
 </figure>
@@ -749,13 +798,20 @@ Note that the traditional discrete-time noise-scheduler $`{\beta_t}_{t=0}^T`$ is
 While the noising schedule of DMs results in a stochastic process that resembles a random walk, FM allows for more general--potentially, deterministic--likelihood and posterior parametrization. In the FM literature the likelihood and posterior probabilty densities defined along a HMLV model are typically jointly referred to as a *probability path*, where the distributions for successive adjacent transitions in the HMLV model are related by the (normalized) flow between them (Figure <a href="#ch4-normalizing-flows" data-reference-type="ref" data-reference="ch4-normalizing-flows">[ch4-normalizing-flows]</a>). The inherent flexibility of FM is one of their key advantages over DMs, as it opens up the possibility of *learning* more efficient paths. For instance, one can design probability paths inspired by Optimal Transport (OT)--a subdiscipline studying the problem of finding the most efficient way to morph one probability distribution into another. Probability paths obtained through OT paths tend to be *straighter* than diffusion paths (Figure <a href="#ch4-diffusion-paths-versus-fm" data-reference-type="ref" data-reference="ch4-diffusion-paths-versus-fm">[ch4-diffusion-paths-versus-fm]</a>), which can lead to faster and more stable training, as well as higher-quality sample generation with fewer steps at inference time. By avoiding unnecessary backtracking associated with the inherent stochastic nature of both the noising and denoising process in DMs, test-time compute is typically significantly reduced, while retaining comparable results @lipmanFlowMatchingGenerative2023.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-diffusion-vs-flowmatching.png" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-diffusion-vs-flowmatching.png" />
 <p>&lt;span id="ch4-diffusion-paths-versus-fm" style="position- absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Compared to diffusion, flow matching distorts distribution along a less randomic pattern, resulting in a clearer interpolation between source and target distribution. The visualization shows an example comparison between these two methods on joint distribution of robot observations and actions over <span class="math inline"><em>T</em> = 50</span> steps.</figcaption>
 </figure>
 
-In practice, FM can be applied to generative modeling by learning a vector field regressor $`v_\theta(z, t)`$ to approximate a given target vector field $`u(t, z)`$. In the particular case of DMs, $`u(t, z)`$ is defined as in <a href="#fm-diffusion-vector-field" data-reference-type="ref" data-reference="fm-diffusion-vector-field">[fm-diffusion-vector-field]</a>, while in priciple the target vector field can be learned to induce a particular transportation, or fixed according to OT. Given a sample from the data distribution $`z_1 \sim p_1`$ and a sample from an easy-to-sample prior $`z_0 \sim p_0`$, CFM defines a simple path between them using *linear interpolation* between samples $`z_t = (1-t)z_0 + t z_1`$, resulting in the target vector field $`u(t, z_t) = z_1 - z_0`$. Then, a FM model can be trained with the simple regression objective defined as $`\htmlId{flow-matching-objective}{\mathcal L(\theta) = \mathbb{E}_{t, z_0, z_1} \big[
-        \Vert v_\theta((1-t)z_0 + t z_1, t) - (z_1 - z_0) \Vert^2 \big], \quad t \sim \mathcal{U}([0,1]),}`$ where $`z_0 \sim p_0(\bullet)`$ and $`z_1 \sim p_1(\bullet)`$. Note how in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a>--differently from <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>--time is assumed to be varying continuously $`t \sim \mathcal U([0,1])`$ rather than discretely $`t \sim \mathcal U(\{0,1\})`$, a key property of flow-based models. The objective in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a> directly regresses the learned vector field onto the simple, straight path connecting a point from the prior and a point from the data, providing a simulation-free training procedure that is both stable and efficient. At inference time, samples are generated by starting with $`z_0 \sim p_0`$ and iteratively refined according to $`\frac{dz}{dt} = v_\theta(z_t, t)`$ for $`t \in [0,1]`$--an operation that can be numerically carried out with standard ODE solvers.
+In practice, FM can be applied to generative modeling by learning a vector field regressor $`v_\theta(z, t)`$ to approximate a given target vector field $`u(t, z)`$. In the particular case of DMs, $`u(t, z)`$ is defined as in <a href="#fm-diffusion-vector-field" data-reference-type="ref" data-reference="fm-diffusion-vector-field">[fm-diffusion-vector-field]</a>, while in priciple the target vector field can be learned to induce a particular transportation, or fixed according to OT. Given a sample from the data distribution $`z_1 \sim p_1`$ and a sample from an easy-to-sample prior $`z_0 \sim p_0`$, CFM defines a simple path between them using *linear interpolation* between samples $`z_t = (1-t)z_0 + t z_1`$, resulting in the target vector field $`u(t, z_t) = z_1 - z_0`$. Then, a FM model can be trained with the simple regression objective defined as
+``` math
+\begin{align}
+
+    \mathcal L(\theta) = \mathbb{E}_{t, z_0, z_1} \big[
+        \Vert v_\theta((1-t)z_0 + t z_1, t) - (z_1 - z_0) \Vert^2 \big], \quad t \sim \mathcal{U}([0,1]),
+\end{align}
+```
+where $`z_0 \sim p_0(\bullet)`$ and $`z_1 \sim p_1(\bullet)`$. Note how in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a>--differently from <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>--time is assumed to be varying continuously $`t \sim \mathcal U([0,1])`$ rather than discretely $`t \sim \mathcal U(\{0,1\})`$, a key property of flow-based models. The objective in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a> directly regresses the learned vector field onto the simple, straight path connecting a point from the prior and a point from the data, providing a simulation-free training procedure that is both stable and efficient. At inference time, samples are generated by starting with $`z_0 \sim p_0`$ and iteratively refined according to $`\frac{dz}{dt} = v_\theta(z_t, t)`$ for $`t \in [0,1]`$--an operation that can be numerically carried out with standard ODE solvers.
 
 ### Action Chunking with Transformers
 
@@ -763,15 +819,22 @@ While GMs prove useful in learning complex, high-dimensional multi-modal distrib
 
 On the robot learning side of their contributions, @zhaoLearningFineGrainedBimanual2023 adopt transformers as the architectural backbone to learn a *Conditional* VAE @sohnLearningStructuredOutput2015. Conditional VAEs are a variation of the more standard VAE formulation introducing a conditioning variable on sampling from the latent prior, allowing the modeling of *one-to-many* relationships between latent and data samples. Further, in stark contrast with previous work @florenceImplicitBehavioralCloning2022, @jannerPlanningDiffusionFlexible2022, @zhaoLearningFineGrainedBimanual2023 do not learn a full joint $`p_\theta(o,a)`$ on observation and actions. While the *policy* distribution $`p_\theta(a \vert o)`$ can in principle be entirely described from its joint $`p_\theta(o,a)`$, it is often the case that the conditional distribution is intractable when using function approximators, as $`p_\theta(a \vert o) = \tfrac{p_\theta(o,a)}{\int_\mathcal Ap_\theta(o,a)}`$ and the integral in the denominator is typically intractable. Instead of modeling the full joint using a vanilla VAE, @zhaoLearningFineGrainedBimanual2023 propose learning a *conditional* VAE @sohnLearningStructuredOutput2015 modeling the policy distribution directly $`p (a \vert o)`$.
 
-In practice, when learning from demonstrations adopting CVAEs results in a slight modification to the VAE objective in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, which is adapted to $`\htmlId{c-ELBO}{\text{ELBO}_{\mathcal D}(\theta, \phi, \omega) = \sum_{i=0}^{N} \left(
+In practice, when learning from demonstrations adopting CVAEs results in a slight modification to the VAE objective in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, which is adapted to
+``` math
+\begin{align}
+
+    \text{ELBO}_{\mathcal D}(\theta, \phi, \omega) = \sum_{i=0}^{N} \left(
             \mathbb{E}_{z \sim q_\phi(\cdot \vert o_i, a_i)} \big[ \log p_\theta(a_i \vert z, o_i) \big]
         - \text{D}_{\text{KL}}\big[ q_\phi(z \vert o_i, a_i) \Vert p_\omega(z \vert o_i) \big]
-        \right)}`$ Notice how in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> we are now also learning a new set of parameters $`\omega`$ for the prior distribution in the latent space. Effectively, this enables conditioning latent-space sampling (and thus reconstruction) during training, and potentially inference, providing useful when learning inherently conditional distributions like policies. Further, ACT is trained as a $`\beta`$-CVAE @higgins2017beta, using a weight of the KL regularization term in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> as an hyperparameter regulating the information condensed in the latent space, where higher $`\beta`$ results in a less expressive latent space.
+        \right)
+\end{align}
+```
+Notice how in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> we are now also learning a new set of parameters $`\omega`$ for the prior distribution in the latent space. Effectively, this enables conditioning latent-space sampling (and thus reconstruction) during training, and potentially inference, providing useful when learning inherently conditional distributions like policies. Further, ACT is trained as a $`\beta`$-CVAE @higgins2017beta, using a weight of the KL regularization term in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> as an hyperparameter regulating the information condensed in the latent space, where higher $`\beta`$ results in a less expressive latent space.
 
 In their work, @zhaoLearningFineGrainedBimanual2023 ablated using a GM to learn from human demonstrations compared to a simpler, supervised objective, $`\mathcal L_1(a,a^\prime) = \Vert a - a^\prime \Vert_1`$. Interestingly, they found the performance of these two approaches to be comparable when learning from *scripted* demonstrations. That is, when learning from data collected rolling out a predetermined set of commands $`[q^c_0, q^c_1, \dots]`$, GM did *not* prove competitive compared to standard supervised learning. However, when learning from human demonstrations--i.e., from data collected executing commands coming from a human controller $`[q^h_0, q^h_1, \dots]`$--they found performance (success rate on a downstream task) to be severily (-33.3%) hindered from adopting a standard supervised learning objective compared to a richer, potentially more complex to learn variational objective, in keeping with the multimodal nature of human demonstrations data and findings presented in @florenceImplicitBehavioralCloning2022. The authors also ablate the action chunking paradigm, reporting significant performance gains for performing action chunking (1% vs. 44% success rate). To avoid acting openloop, @zhaoLearningFineGrainedBimanual2023 design an inference process consisting in performing inference at every timestep $`t`$ and then aggregate overlapping chunks using chunks’ exponential moving average.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-act.png" style="width-90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-act.png" style="width-90.0%" />
 <p>&lt;span id="ch4-act" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Action Chunking with Transformer (ACT), as in @zhaoLearningFineGrainedBimanual2023. ACT introduces an action chunking paradigm to cope with high-dimensional multi-modal demonstration data, and a transformer-based CVAE architecture.</figcaption>
 </figure>
@@ -779,7 +842,7 @@ In their work, @zhaoLearningFineGrainedBimanual2023 ablated using a GM to learn
 In ACT (Figure <a href="#ch4-act" data-reference-type="ref" data-reference="ch4-act">[ch4-act]</a>), inference for a given observation $`o \in \mathcal O`$ could be performed by (1) computing a prior $`p_\omega(z \vert o)`$ for the latent and (2) decoding an action chunk from a sampled latent $`z \sim p_\omega(\bullet \vert o)`$, similarily to how standard VAEs generate samples, with the exception that vanilla VAEs typically pose $`p(z\vert o) \equiv p(z) \sim N(\mathbf{0}, \mathbf{I})`$ and thus skip (1).
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-act-encoder.png" style="width:75.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-act-encoder.png" style="width:75.0%" />
 <p>&lt;span id="ch4-act-encoder" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>The CVAE encoder used in ACT. Input action chunks are first embedded and aggregated with positional embeddings, before being processed alongside embedded proprioperceptive information, and a learned <code>[CLS]</code> token used to aggregate input level information, and predict the style variable <span class="math inline"><em>z</em></span>. The encoder is entirely disregarded at inference time.</figcaption>
 </figure>
@@ -787,7 +850,7 @@ In ACT (Figure <a href="#ch4-act" data-reference-type="ref" data-reference="ch4
 However, the authors claim using a deterministic procedure to derive $`z`$ may benefit policy evaluation, and thus avoid sampling from the conditional prior at all. At test time, instead, they simply use $`z = \mathbf{0}`$, as the conditional prior on $`z`$ used in training is set to be the unit Gaussian. At test time, conditioning on the observation $`o`$ is instead achieved through explicitly feeding proprioperceptive and visual observations to the decoder, $`p_\theta(a \vert z, o)`$, while during training $`z`$ is indeed sampled from the approximate posterior distribution $`p_\phi(z \vert o, a)`$, which, however, disregards image observations and exclusively uses proprioperceptive states to form $`o`$ for efficiency reasons (as the posterior $`q_\phi`$ is completely disregarded at test time).
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-act-decoder.png" style="width:75.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-act-decoder.png" style="width:75.0%" />
 <p>&lt;span id="ch4-act-decoder" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>The CVAE decoder used in ACT, comprising of a full encoder-decoder Transformer architecture. Camera observations from all <span class="math inline"><em>n</em></span> camera views are first embedded using pre-trained visual encoders, and then concatenated to the corresponding positional embeddings. Then, alongside embeddings for the proprioperceptive information available and the style variable <span class="math inline"><em>z</em></span> retrieved from the CVAE encoder, the Transformer encoder shares the matrices <span class="math inline"><em>K</em>, <em>Q</em></span> with the Transformer decoder, trained to decode fixed position embeddings into action valid chunks.</figcaption>
 </figure>
@@ -798,18 +861,20 @@ However, the authors claim using a deterministic procedure to derive $`z`$ may b
 
 DMs proved very effective in approximating complex highly dimensional distributions, such as distributions over images @hoDenoisingDiffusionProbabilistic2020 or videos @polyakMovieGenCast2025, thanks to their inherent capability to deal with multimodal data and training stability. In Diffusion Policy (DP), @chiDiffusionPolicyVisuomotor2024 present an application of DMs the field of robot learning, leveraging diffusion to model human expert demonstrations in a variety of simulated and real-world tasks. Similarily to Action Chunking with Transformer @zhaoLearningFineGrainedBimanual2023, @chiDiffusionPolicyVisuomotor2024 (1) adopt a modified *observation-conditioned target distribution* instead of the full joint $`p(o,a)`$ and (2) predict multiple actions into the future instead of a single action. Besides the intractability of the observations’ marginal $`p_\theta(o)`$ given $`p_\theta(o,a)`$, DP’s rationale for modeling the data distribution via $`p_\theta(a \vert o)`$ stems from the rather test-time compute intensive nature of diffusion, whereby generating actions *alongside* observations is likely to result in higher complexity and thus a likely larger number of denoising operations, which would prove ultimately pointless considering robotics applications rely on the capability to generate controls rather than reproducing observations.
 
-In practice, conditioning on observation data is achieved conditioning the added noise regressor $`\epsilon_\theta`$ introduced in <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a> on a stack of $`T_o`$ observations, resulting in the *conditional* simplified diffusion objective 
-$$
-`\htmlId{diffusion-policy-objective}{\mathcal L(\theta) = \mathbb{E}_{t, a_{t:t+H_a}, \epsilon} \big[
-        \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} a_{t:t+T_a} + \epsilon \sqrt{1 - \bar \alpha_t}, t, o_{t-T_o:t}) \Vert^2 \big],\\
-    t \sim \mathcal{U}(\{1,\dots,T\}), \quad
+In practice, conditioning on observation data is achieved conditioning the added noise regressor $`\epsilon_\theta`$ introduced in <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a> on a stack of $`T_o`$ observations, resulting in the *conditional* simplified diffusion objective
+``` math
+\begin{align}
+    \mathcal L(\theta) &= \mathbb{E}_{t, a_{t:t+H_a}, \epsilon} \big[
+        \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} a_{t:t+T_a} + \epsilon \sqrt{1 - \bar \alpha_t}, t, o_{t-T_o:t}) \Vert^2 \big],  \\
+        & t \sim \mathcal{U}(\{1,\dots,T\}), \quad
         a_{t:t+T_a}, o_{t-T_o:t} \sim \mathcal{D}, \quad
-        \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}). \notag}`
-$$
- Notice how in <a href="#diffusion-policy-objective" data-reference-type="ref" data-reference="diffusion-policy-objective">[diffusion-policy-objective]</a> the noise regressor is conditioned both on the latent variable rank $`t`$ *and* on a stack of previous observations $`o_{t-T_o-t}`$.  @chiDiffusionPolicyVisuomotor2024 claim the combination of (1) conditioning on a horizon of previous observations and (2) predicting multiple actions into the future allows DP to *commit to specific modes* in the data at inference time, which proves essential for good performance and avoiding undecisiveness.
+        \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}). \notag 
+\end{align}
+```
+Notice how in <a href="#diffusion-policy-objective" data-reference-type="ref" data-reference="diffusion-policy-objective">[diffusion-policy-objective]</a> the noise regressor is conditioned both on the latent variable rank $`t`$ *and* on a stack of previous observations $`o_{t-T_o-t}`$.  @chiDiffusionPolicyVisuomotor2024 claim the combination of (1) conditioning on a horizon of previous observations and (2) predicting multiple actions into the future allows DP to *commit to specific modes* in the data at inference time, which proves essential for good performance and avoiding undecisiveness.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-diffusion-policy.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-diffusion-policy.png" style="width:90.0%" />
 <p>&lt;span id="diffusion-policy-architecture" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>The Diffusion Policy archicture, as in @chiDiffusionPolicyVisuomotor2024. A stack of <span class="math inline"><em>H</em><sub><em>o</em></sub></span> previous observations is used as external conditioning to denoise a group of <span class="math inline"><em>H</em><sub><em>a</em></sub></span> actions. Conditioning is used at every layer of a U-Net block, and in practice allows to obtain fully-formed action chunks with as little as <span class="math inline"><em>T</em> = 10</span> denoising steps.</figcaption>
 </figure>
@@ -834,7 +899,7 @@ We directly assess the lack of adaptiveness of robot systems due to acting open-
 
 <figure>
 <div class="minipage">
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-async-inference.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-async-inference.png" style="width:90.0%" />
 <p>&lt;span id="ch4-async-inference" style="position: absolute;"&gt;&lt;/span&gt;</p>
 </div>
 <figcaption><strong>Asynchronous inference</strong>. Illustration of the asynchronous inference stack. Note that the policy can be run on a remote server, possibly with GPUs.</figcaption>
@@ -874,7 +939,7 @@ Interestingly, the behavior of async inference can be studied analytically. Firs
 
 <figure>
 <div class="minipage">
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch4/ch4-queues.png" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch4/ch4-queues.png" />
 <p>&lt;span id="ch4-queues" style="position: absolute;"&gt;&lt;/span&gt;</p>
 </div>
 <figcaption>Action queue size evolution at runtime for various levels of <span class="math inline"><em>g</em></span> when (A) not filtering out observation based on joint-space similarity and (B) filtering out near-duplicates observation, measuring their similarity in joint-space.</figcaption>
@@ -905,7 +970,7 @@ TL;DR Openly available large scale datasets and the development of stable, expre
 The advent of large models trained on internet-scale datasets has drastically influenced fields like Computer Vision (CV) and Natural Language Processing (NLP), shifting the paradigm towards combining (1) an initial, task-agnostic large-scale pre-training stage and a (2) task-specific, adjustment phase. The pre-training/adaptation paradigm has now largely replaced more classic approaches consisting of task-specific data collection, curation and model training in many subdomains within CV and NLP, motivated by the main drawback of limited scalability for *task-specific approaches*, traditionally labor intensive. Factors including (1) the advancements in generalist models learned with self-supervision for perception @oquabDINOv2LearningRobust2024 or semantic understanding @devlinBERTPretrainingDeep2019 and (2) the popularization collective efforts to aggregate large-scale openly available datasets @collaborationOpenXEmbodimentRobotic2025, @khazatskyDROIDLargeScaleInTheWild2025 are increasingly pushing the field of robot learning towards the pre-train-and-adapt paradigm. This shift taps into the long-standing challenge of developing generalist robot policies, and holds the premise to surpass traditionally siloed approaches to robotics problems and develop a *foundation robotics model*. While Section <a href="#learning-bc-single" data-reference-type="ref" data-reference="learning-bc-single">[learning-bc-single]</a> introduced methods for learning *single-task policies* such as ACT or Diffusion Policy, in this section we present advancements in developing *generalist, multi-task, policies*, capable of performing a wide range of tasks across different environments and embodiments, and guided by unstructured instructions given via natural language.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-ml-vs-robotics-foundation.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-ml-vs-robotics-foundation.png" style="width:90.0%" />
 <p>&lt;span id="ch5-ml-vs-robotics-foundation" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Fields within ML such as Computer Vision and NLP converged on the development of foundation models, trained on a variety of large scale models and capable to perform multiple downstream tasks (top). Conversely, robotics suffered from limited standardization in terms of the architectures used, and siloed, task specific datasets, incurring in a high degree of fragmentation which traditionally hindered the development of generalist models for robotics in favour of task-specific models (bottom).</figcaption>
 </figure>
@@ -915,7 +980,7 @@ The advent of large models trained on internet-scale datasets has drastically in
 The remarkable success of foundation models in NLP and CV is predicated on two core principles: architectural innovation and joint data-compute scaling. The transformer architecture proved instrumental in capturing long-range dependencies in sequential data such as text, and its stability and expressivity made it the *de facto* standard for modern large-scale models trained on internet-scale amounts of data. In stark contrast with popular NLP @raffelExploringLimitsTransfer2023 and CV @ImageNet_VSS09 general-purpose datasets, the field of robotics has historically developed around task-specific datasets which hinders scalability across problems, resulting in a concrete data deficit for general-purpose robot learning. Unlike the wealth of relatively readily available text and images on the internet, robotics data is intrinsically embodied--datasets collected for a manipulation robot typically differ entirely from locomotion datasets. Further, datasets consisting of expert demonstrations are (1) intrinsically expensive to collect (2) and notoriously heterogeneous--different human experts may perform the same task optimally yet in very different ways. In particular, since each expert trajectory is tied to a specific robot platform and the operating conditions of its environment and task, data heterogeneity has long posed a *methodological* challenge for scaling robotics datasets via aggregation. Beyond this, heterogeneity also raises *conceptual* issues: naively mixing data across embodiments can induce negative transfer, as control strategies developed in isolation for different robot systems in different environments may even conflict when combined. Thus, the high degree of fragmentation of robotics datasets and tasks has traditionally led to the development of *specialist* policies, trained on small, task-specific datasets, and which excel at their designated task but fail to generalize to new situations (Figure <a href="#ch5-ml-vs-robotics-foundation" data-reference-type="ref" data-reference="ch5-ml-vs-robotics-foundation">[ch5-ml-vs-robotics-foundation]</a>).
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-generalist-policies-timeline.png" style="width-80.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-generalist-policies-timeline.png" style="width-80.0%" />
 <p>&lt;span id="ch5-generalist-policies-timeline" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Early efforts in the development of generalist models for robotics include BC-Zero @jangBCZZeroShotTask2022, RT-1 @brohanRT1RoboticsTransformer2023, and RT-2 @brohanRT2VisionLanguageActionModels2023: large scale models trained on thousands of demonstrations. The open release of the Open-X @collaborationOpenXEmbodimentRobotic2025 and DROID datasets @khazatskyDROIDLargeScaleInTheWild2025 fostered the development of open source models: OpenVLA @kimOpenVLAOpenSourceVisionLanguageAction2024, <span class="math inline"><em>π</em><sub>0</sub></span> @blackp0VisionLanguageActionFlow2024 and SmolVLA @shukorSmolVLAVisionLanguageActionModel2025.</figcaption>
 </figure>
@@ -929,7 +994,7 @@ Traditionally, research involved not only training the model but also collecting
 The success of large, proprietary models like RT-1 and RT-2, highlighted a growing accessibility gap in robotics research, as training and deploying large-scale models requires computational resources simply unattainable for most research institutions. The OpenVLA project @kimOpenVLAOpenSourceVisionLanguageAction2024 emerged in direct contrast of closed-source counterparts, as a community-driven effort to create powerful, openly available VLAs. In particular, @kimOpenVLAOpenSourceVisionLanguageAction2024 trained OpenVLA by exclusively leveraging openly available data (970K+ from the Open-X dataset), and share training recipes alongside the model weights. Architecturally, OpenVLA integrates a pre-trained vision encoder to project visual tokens into the embedding space of Llama2-7B @touvronLlama2Open2023 language model backbone. The language model backbone is then used to predict *discrete action tokens* over 256 activation levels.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-trends.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-trends.png" style="width:90.0%" />
 <p>&lt;span id="ch5-trends" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>Robot learning is undergoing a paradigmatic shift: centralized data collections (A, left) are increasingly larger, often comprising Ms of demonstrations, and (A, right) decentralized approaches to data collection are also rising as an alternative for large scale data collection. (B) Generalist models are also becoming increasingly smaller and easier to run on limited hardware.</figcaption>
 </figure>
@@ -953,7 +1018,7 @@ Recently, compute efficiency has also become a central focus in VLM research. Se
 $`\pi_0`$ @blackp0VisionLanguageActionFlow2024 introduce a VLA consisting of a MoE architecture consisting of (1) a pre-trained VLM backbone (Gemma 2.6B @teamGemma2Improving2024) and (2) a dedicated action expert used to generate continuous actions via flow matching. Images and language are embedded with a late-fusion VLM (PaliGemma), while proprioceptive state and actions chunks are routed to a smaller action expert, initialized from scratch. The two separate experts communicate via self-attention layers, but maintain disjoint weights to obtain query, key and values matrices at each layer, maintaining specialization while efficiently allocating computation.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-pi0.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-pi0.png" style="width:90.0%" />
 <p>&lt;span id="ch5-pi0" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>The <span class="math inline"><em>π</em><sub>0</sub></span>architecture, as in @blackp0VisionLanguageActionFlow2024. Vision and language tokens are routed to a VLM backbone which is prevented from attending robot proprioperceptive states and action tokens, which are instead routed to a smaller subset of weights within the architecture. The architecture is trained with Flow Matching on 10M+ trajectories from a mixture of closed and openly available datasets.</figcaption>
 </figure>
@@ -967,20 +1032,22 @@ Concretely, $`\pi_0`$ is a unified transformer with two disjoint sets of weights
     },
     \quad \mathbf{1}: \text{Bidirectional Attention}, \ \mathbf{0}: \text{Masked Attention}`$ Note how *intra*-block directional attention allows tokens to communicate freely, while *inter*-block communication is mediated by the attention mask $`\mathbf{A}`$. *Blockwise causal masking* effectively prevents the pre-trained perception-language tokens from attending to robotics-tokens, likely out of distribution for VLM backbones traditionally trained on large corpora of internet, non-robotics, data. Crucially, because communication is obstructed between image-language tokens, proprioperceptive and action tokens, one can cache keys and values across denoising steps at runtime time, incuring in a reduced computational footprint and faster inference.
 
-In $`\pi_0`$, both the VLM backbone and action expert are update using a *flow matching* loss, and in particular are updated minimizing: 
-$$
-`\htmlId{pi0-loss}{\mathcal{L}(\phi, \theta) = 
+In $`\pi_0`$, both the VLM backbone and action expert are update using a *flow matching* loss, and in particular are updated minimizing:
+``` math
+\begin{align}
+    \mathcal{L}(\phi, \theta) &= 
     \mathbb{E}_{\tau, \epsilon, o_t, a_{t:t+H_a}}\Big[
         \big\Vert 
             v_\theta(\underbrace{\tau a_{t:t+H_a} + (1-\tau) \epsilon}_{\tilde a_{t:t+H_a}},\, o_t,\, \tau)
             - (\epsilon - a_{t:t+H_a})
         \big\Vert^2
-    \Big],\\
-    \tau \sim \mathrm{Beta}_{[0,s]}(1.5,1), \quad
+    \Big],  \\
+    &\tau \sim \mathrm{Beta}_{[0,s]}(1.5,1), \quad
     \epsilon \sim \mathcal{N}(\mathbf{0}, \mathbf{I}), \quad
-    o_t, a_{t:t+H_a} \sim \mathcal D \notag}`
-$$
- Where the experts parametrized by the separate weights $`\phi, \theta`$ interact with each other via self-attention layers only, so that the action expert $`v_\theta`$ internal computations also depend on the VLM backbone’s parameters $`\phi`$. Importantly, @blackp0VisionLanguageActionFlow2024 minimize <a href="#pi0-loss" data-reference-type="ref" data-reference="pi0-loss">[pi0-loss]</a> over both the multimodal backbone and action expert parameters, thus updating the internal representations of the VLM using BC-specific gradients. In contrast, @driessKnowledgeInsulatingVisionLanguageAction2025 later show that failing to insulate the VLM knowledge from the flow matching gradients actually harms performance. Inference is performed iteratively refining action chunks while numerically forward-integrating the vector field predicted by the action expert,
+    o_t, a_{t:t+H_a} \sim \mathcal D \notag
+\end{align}
+```
+Where the experts parametrized by the separate weights $`\phi, \theta`$ interact with each other via self-attention layers only, so that the action expert $`v_\theta`$ internal computations also depend on the VLM backbone’s parameters $`\phi`$. Importantly, @blackp0VisionLanguageActionFlow2024 minimize <a href="#pi0-loss" data-reference-type="ref" data-reference="pi0-loss">[pi0-loss]</a> over both the multimodal backbone and action expert parameters, thus updating the internal representations of the VLM using BC-specific gradients. In contrast, @driessKnowledgeInsulatingVisionLanguageAction2025 later show that failing to insulate the VLM knowledge from the flow matching gradients actually harms performance. Inference is performed iteratively refining action chunks while numerically forward-integrating the vector field predicted by the action expert,
 ``` math
 \begin{equation}
     a_{t:t+H_a}^{\tau + \delta} = a_{t:t+H_a}^{\tau } + \delta v_\theta(a_{t:t+H_a}^{\tau }, o_t)
@@ -991,7 +1058,7 @@ Flow matching  can be seen as a continuous time, detetrministic generalization
 
 <div class="wrapfigure">
 
-r0.4 <img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-pi0-sampling-timesteps.png" alt="image" />
+r0.4 <img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-pi0-sampling-timesteps.png" alt="image" />
 
 \<span id="ch5-pi0-sampling-timesteps" style="position: absolute;"\>\</span\>
 
@@ -1010,7 +1077,7 @@ Lastly, @blackp0VisionLanguageActionFlow2024 present cross-embodiment experimen
 VLAs remain in an early stage of development and are not yet as mature or widely adopted as LLMs and VLMs. Further, much of the impactful VLA progress remains proprietary, with many models sharing only weights while withholding full training details and essential methodological components. SmolVLA @shukorSmolVLAVisionLanguageActionModel2025 is an entirely open-source research effort, aiming to democratize the developments of robotics foundation models by open sourcing model, training recipes and data used.
 
 <figure>
-<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-markdown/output/assets/image/figures/ch5/ch5-smolvla.png" style="width:90.0%" />
+<img src="/Users/thibaudfrere/Documents/work-projects/huggingface/research-article-template/app/scripts/latex-to-mdx/output/assets/image/figures/ch5/ch5-smolvla.png" style="width:90.0%" />
 <p>&lt;span id="ch5-smolvla" style="position: absolute;"&gt;&lt;/span&gt;</p>
 <figcaption>The SmolVLA architecture, as in @shukorSmolVLAVisionLanguageActionModel2025. SmolVLA is a compact MoE model trained with flow matching to denoise action chunks. Vision and language tokens are fed to a VLM backbone, and share information with the proprioperceptive and action tokens via the attention mechanism. The attention expert interleaves SA and CA layers for further conditioning on the visual features from the VLM backbone. SmolVLA skips computations and reduces the visual tokens, resulting in 6x less memory usage than <span class="math inline"><em>π</em><sub>0</sub></span>.</figcaption>
 </figure>
diff --git a/app/scripts/latex-to-markdown/output/main.mdx b/app/scripts/latex-to-mdx/output/main.mdx
similarity index 91%
rename from app/scripts/latex-to-markdown/output/main.mdx
rename to app/scripts/latex-to-mdx/output/main.mdx
index 4eb0c151f674be4e9c1b5e21bc569f85e9da7f86..9ad4c1e32ebca86fca36c154b9262b785a19a0ae 100644
--- a/app/scripts/latex-to-markdown/output/main.mdx
+++ b/app/scripts/latex-to-mdx/output/main.mdx
@@ -89,7 +89,7 @@ We sincerely hope this tutorial serves as a valuable starting point for your jou
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="figure1" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="figure1" style="position: absolute;"></span>
 <figcaption><code>lerobot</code> is the open-source library for end-to-end robotics developed by Hugging Face. The library is vertically integrated on the entire robotics stack, supporting low-level control of real-world robot devices, advanced data and inference optimizations, as well as SOTA robot learning methods with simple implementations in pure Pytorch.</figcaption>
 </figure>
 
@@ -181,7 +181,12 @@ streaming_dataset = StreamingLeRobotDataset(
 # Get the 100th frame in the dataset by 
 sample = dataset[100]
 print(sample)
-# 
+# {
+# 'observation.state': tensor([...]), 
+# 'action': tensor([...]), 
+# 'observation.images.wrist_camera': tensor([3, C, H, W]), for delta timesteps
+# ...
+# }
 
 batch_size=16
 # wrap the dataset in a DataLoader to use process it batches for training purposes
@@ -233,7 +238,7 @@ TL;DR Learning-based approaches to robotics are motivated by the need to (1) gen
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="generating-motion-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="generating-motion-atlas" style="position: absolute;"></span>
 <figcaption>Overview of methods to generate motion (clearly non-exhausitve, see @bekrisStateRobotMotion2024). The different methods can be grouped based on whether they explicitly (<em>dynamics-based</em>) or implicitly (<em>learning-based</em>) model robot-environment interactions.</figcaption>
 </figure>
 
@@ -251,7 +256,7 @@ Methods to produce robotics motion range from traditional *explicit* models--<sp
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robotics-platforms-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robotics-platforms-atlas" style="position: absolute;"></span>
 <figcaption>Different kinds of motions are achieved with potentially very different robotic platforms. From left to right, top to bottom: ViperX, SO-100, Boston Dynamics’ Spot, Open-Duck, 1X’s NEO, Boston Dynamics’ Atlas. This is an example list of robotic platforms and is (very) far from being exhaustive.</figcaption>
 </figure>
 
@@ -275,7 +280,7 @@ Recently, the development of low-cost manipulators like the ALOHA @zhaoLearning
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robotic-platforms-costs" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robotic-platforms-costs" style="position: absolute;"></span>
 <figcaption>Cheaper, more accessible robots are starting to rival traditional platforms like the Panda arm platforms in adoption in resource-constrained scenarios. The SO-100, in particular, has a cost in the 100s of Euros, and can be entirely 3D-printed in hours, while the industrially-manufactured Panda arm costs tens of thousands of Euros and is not openly available.</figcaption>
 </figure>
 
@@ -289,7 +294,7 @@ Deriving an intuition as per why learning-based approaches are gaining popularit
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="make-so100-planar-manipulator" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="make-so100-planar-manipulator" style="position: absolute;"></span>
 <figcaption>The SO-100 arm is a 6-dof manipulator arm. Preventing some of its joints (shoulder pane, wrist flex and wrist roll) from actuating, it can be represented as a traditional 2-dof planar manipulator (the gripper joint in the end-effector is not considered towards the count of the degrees of freedom used to produce motion).</figcaption>
 </figure>
 
@@ -308,7 +313,7 @@ All these simplifying assumptions leave us with the planar manipulator of Figure
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="planar-manipulation-simple" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="planar-manipulation-simple" style="position: absolute;"></span>
 <figcaption>Free to move</figcaption>
 </figure>
 <figure>
@@ -319,7 +324,7 @@ All these simplifying assumptions leave us with the planar manipulator of Figure
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="planar-manipulator-floor" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="planar-manipulator-floor" style="position: absolute;"></span>
 <figcaption>Constrained by the surface</figcaption>
 </figure>
 <figure>
@@ -330,25 +335,24 @@ All these simplifying assumptions leave us with the planar manipulator of Figure
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="planar-manipulator-floor-shelf" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="planar-manipulator-floor-shelf" style="position: absolute;"></span>
 <figcaption>Constrained by surface and (fixed) obstacle</figcaption>
 </figure>
 <figcaption>Planar, 2-dof schematic representation of the SO-100 manipulator under diverse deployment settings. From left to right: completely free of moving; constrained by the presence of the surface; constrained by the surface and presence of obstacles. Circular arrows around each joint indicate the maximal rotation feasible at that joint.</figcaption>
 </figure>
 
-Considering the (toy) example presented in Figure <a href="#planar-manipulation-simple" data-reference-type="ref" data-reference="planar-manipulation-simple">[planar-manipulation-simple]</a>, then we can analytically write the end-effector’s position $p \in \mathbb R^2$ as a function of the robot’s configuration, $p = p(q), p: \mathcal Q \mapsto \mathbb R^2$. In particular, we have: 
-
-$$
-`p(q) = \begin{pmatrix} p_x(\theta_1, \theta_2)\\ p_y(\theta_1, \theta_2) \end{pmatrix} = \begin{pmatrix} l \cos(\theta_1) + l \cos(\theta_1 + \theta_2)\\ l \sin(\theta_1) + l \sin(\theta_1 + \theta_2) \end{pmatrix} \in S^{n=2}_{l_1+l_2} = \{ p(q) \in \mathbb R^2: \Vert p(q) \Vert_2^2 \leq (2l)^2, \ \forall q \in \mathcal Q \}`
-$$
-
-
+Considering the (toy) example presented in Figure <a href="#planar-manipulation-simple" data-reference-type="ref" data-reference="planar-manipulation-simple">[planar-manipulation-simple]</a>, then we can analytically write the end-effector’s position $p \in \mathbb R^2$ as a function of the robot’s configuration, $p = p(q), p: \mathcal Q \mapsto \mathbb R^2$. In particular, we have: $p(q) = \begin{pmatrix} p_x(\theta_1, \theta_2) \\ p_y(\theta_1, \theta_2) \end{pmatrix} = \begin{pmatrix} l \cos(\theta_1) + l \cos(\theta_1 + \theta_2) \\ l \sin(\theta_1) + l \sin(\theta_1 + \theta_2) \end{pmatrix} \in S^{n=2}_{l_1+l_2} = \{ p(q) \in \mathbb R^2: \Vert p(q) \Vert_2^2 \leq (2l)^2, \ \forall q \in \mathcal Q \}$
 
 Deriving the end-effector’s *pose*--position *and* orientation--in some $m$-dimensional space $\boldsymbol{p} \in \mathcal{P} \subset \mathbb{R}^{m}$ starting from the configuration ${\textnormal{q}}\in \mathcal Q \subset \mathbb R^n$ of a $n$-joints robot is referred to as *forward kinematics* (FK), whereas identifying the configuration corresponding to any given target pose is termed *inverse kinematics* (IK). In that, FK is used to map a robot configuration into the corresponding end-effector pose, whereas IK is used to reconstruct the configuration(s) given an end-effector pose.
 
 In the simplified case here considered (for which $\boldsymbol{p} \equiv p$, as the orientation of the end-effector is disregarded for simplicity), one can solve the problem of controlling the end-effector’s location to reach a goal position $p^*$ by solving analytically for $q: p(q) = f_{\text{FK}}(q) = p^*$. However, in the general case, one might not be able to solve this problem analytically, and can typically resort to iterative optimization methods comparing candidate solutions using a loss function (in the simplest case, $\Vert p(q) - p^* \Vert_2^2$ is a natural candidate), yielding:
 
-$\htmlId{ik_problem}{\min_{q \in \mathcal Q} \Vert p(q) - p^* \Vert_2^2 \, .}$
+``` math
+\begin{align}
+\min_{q \in \mathcal Q} \Vert p(q) - p^* \Vert_2^2 \, .
+
+\end{align}
+```
 
 Exact analytical solutions to IK are even less appealing when one considers the presence of obstacles in the robot’s workspace, resulting in constraints on the possible values of $q \in \mathcal Q \subseteq [-\pi, +\pi]^n \subset \mathbb R^n$ in the general case of $n$-links robots.
 
@@ -356,7 +360,13 @@ For instance, the robot in Figure <a href="#planar-manipulator-floor" data-refe
 
 However, IK--solving eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a> for a feasible $q$--only proves useful in determining information regarding the robot’s configuration in the goal pose, and crucially does not provide information on the *trajectory* to follow over time to reach a target pose. Expert-defined trajectories obviate to this problem providing a length-$K$ succession of goal poses $\tau_K = [p^*_0, p^*_1, \dots p^*_K]$ for tracking. In practice, trajectories can also be obtained automatically through *motion planning* algorithms, thus avoiding expensive trajectory definition from human experts. However, tracking $\tau_K$ via IK can prove prohibitively expensive, as tracking would require $K$ resolutions of eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a> (one for each target pose). *Differential* inverse kinematics (diff-IK) complements IK via closed-form solution of a variant of eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a>. Let $J(q)$ denote the Jacobian matrix of (partial) derivatives of the FK-function $f_\text{FK}- \mathcal Q \mapsto \mathcal P$, such that $J(q) = \frac{\partial f_{FK}(q)}{\partial q }$. Then, one can apply the chain rule to any $p(q) = f_{\text{FK}}(q)$, deriving $\dot p = J(q) \dot q$, and thus finally relating variations in the robot configurations to variations in pose, thereby providing a platform for control.
 
-Given a desired end-effector trajectory $\dot {p}^*(t)$ (1) indicating anchor regions in space and (2) how much time to spend in each region, diff-IK finds $\dot q(t)$ solving for joints’ *velocities* instead of *configurations*, $\htmlId{reg_ik_velocity}{\dot q(t) = \arg\min_\nu \; \lVert J(q(t)) \nu - \dot {p}^*(t) \rVert_2^2}$
+Given a desired end-effector trajectory $\dot {p}^*(t)$ (1) indicating anchor regions in space and (2) how much time to spend in each region, diff-IK finds $\dot q(t)$ solving for joints’ *velocities* instead of *configurations*,
+``` math
+\begin{align}
+\dot q(t) = \arg\min_\nu \; \lVert J(q(t)) \nu - \dot {p}^*(t) \rVert_2^2
+
+\end{align}
+```
 
 Unlike eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a>, solving for $\dot q$ is much less dependent on the environment (typically, variations in velocity are constrained by physical limits on the actuators). Conveniently, eq. <a href="#reg_ik_velocity" data-reference-type="ref" data-reference="reg_ik_velocity">[reg_ik_velocity]</a> also often admits the closed-form solution $\dot q = J(q)^+ \dot {p}^*$, where $J^+(q)$ denotes the Moore-Penrose pseudo-inverse of $J(q)$. Finally, discrete-time joint configurations $q$ can be reconstructed from joint velocities $\dot q$ using forward-integration on the continuous-time joint velocity , $q_{t+1} = q_t + \Delta t\,\dot q_t$ for a given $\Delta t$, resulting in tracking via diff-IK.
 
@@ -401,7 +411,7 @@ Despite the last 60+ years of robotics research, autonomous robots are still lar
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="classical-limitations" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="classical-limitations" style="position: absolute;"></span>
 <figcaption>Dynamics-based approaches to robotics suffer from several limitations: (1) orchestrating multiple components poses integration challenges; (2) the need to develop custom processing pipelines for the sensing modalities and tasks considered hinders scalability; (3) simplified analytical models of physical phenomena (here friction at the gripper; credits to @antonovaReinforcementLearningPivoting2017) limit real-world performance. Lastly, (4) dynamics-based methods overlook trends in the availability and growth of robotics data.</figcaption>
 </figure>
 
@@ -438,7 +448,7 @@ TL;DR The need for expensive high-fidelity simulators can be obviated by learnin
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robot-learning-upsides" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robot-learning-upsides" style="position: absolute;"></span>
 <figcaption>Learning-based robotics streamlines perception-to-action by learning a (1) unified high-level controller capable to take (2) high-dimensional, unstructured sensorimotor information. Learning (3) does not require a dynamics model and instead focuses on interaction data, and (4) empirically correlates with the scale of the data used. </figcaption>
 </figure>
 
@@ -454,7 +464,7 @@ Being a field at its relative nascent stages, no prevalent technique(s) proved d
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robot-learning-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robot-learning-atlas" style="position: absolute;"></span>
 <figcaption>Overview of the robot learning methods implemented in <code>lerobot</code>.</figcaption>
 </figure>
 
@@ -470,7 +480,7 @@ Figure <a href="#robot-learning-atlas" data-reference-type="ref" data-reference
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robotics-with-rl-examples" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robotics-with-rl-examples" style="position: absolute;"></span>
 <figcaption>Examples of two different robotics tasks performed using RL. In the manipulation task (A) an agent learns to reach for a yellow plastic block in its environment, and to put it inside of a box. In the locomotion task (B) an agent learns to move its center of mass sideways without falling.</figcaption>
 </figure>
 
@@ -488,7 +498,7 @@ The RL framework @suttonReinforcementLearningIntroduction2018, which we briefly
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="rl-most-famous-pic" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="rl-most-famous-pic" style="position: absolute;"></span>
 <figcaption>Agent-Environment interaction diagram (image credits to @suttonReinforcementLearningIntroduction2018).</figcaption>
 </figure>
 
@@ -510,30 +520,35 @@ A length-$T$ *trajectory* is the (random) sequence
 ``` math
 \htmlId{trajectory_definition}{\tau = (s_0, a_0, r_0, s_1, a_1, r_1, \dots, s_{T-1}, a_{T-1}, r_{T-1}, s_T),}
 ```
-with per-step rewards defined as $r_t = r (s_t, a_t, s_{t+1})$ for ease of notation.Interestingly, assuming both the environment dynamics and conditional distribution over actions given states--the *policy*--to be *Markovian*: 
 
-$$
-`\htmlId{dynamics_markovian}{\mathbb P(s_{t+1}\vert s_t, a_t, s_{t-1}, a_{t-1}, \dots s_0, a_0 ) = \mathbb P (s_{t+1}\vert s_t, a_t)\\ \mathbb P(a_t\vert s_t, a_{t-1}, s_{t-1}, s_0, a_0) = \mathbb P(a_t\vert s_t)}`
-$$
+with per-step rewards defined as $r_t = r (s_t, a_t, s_{t+1})$ for ease of notation.Interestingly, assuming both the environment dynamics and conditional distribution over actions given states--the *policy*--to be *Markovian*:
 
- The probability of observing a given trajectory $\tau$ factorizes into
+``` math
+\begin{align}
+\mathbb P(s_{t+1}\vert s_t, a_t, s_{t-1}, a_{t-1}, \dots s_0, a_0 ) &= \mathbb P (s_{t+1}\vert s_t, a_t) \\
+\mathbb P(a_t\vert s_t, a_{t-1}, s_{t-1}, s_0, a_0) &= \mathbb P(a_t\vert s_t) 
+\end{align}
+```
+The probability of observing a given trajectory $\tau$ factorizes into
 ``` math
 \htmlId{traj_prob}{\mathbb P(\tau) = \mathbb P (s_0) \prod_{t=0}^{T-1} \mathbb P (s_{t+1}\vert s_t, a_t)\ \mathbb P(a_t\vert s_t).}
 ```
 
 Policies $\mathbb P(a_t\vert s_t)$ are typically indicated as $\pi(a_t\vert s_t)$, and often parametrized via $\theta$, yielding $\pi_\theta (a_t\vert s_t)$. Policies are trained optimizing the (discounted) *return* associated to a given $\tau$, i.e. the (random) sum of measured rewards over trajectory:
+
 ``` math
 G(\tau) = \sum_{t=0}^{T-1} \gamma^{t} r_t.
 ```
-In that, agents seek to learn control strategies (*policies*, $\pi_\theta$) maximizing the expected return $\mathbb E_{\tau \sim \pi_\theta} G(\tau)$. For a given dynamics $\mathcal D$--i.e., for a given problem--taking the expectation over the (possibly random) trajectories resulting from acting according to a certain policy provides a direct, goal-conditioned ordering in the space of all the possible policies $\Pi$, yielding the (maximization) target $J : \Pi \mapsto \mathbb R$ 
-
-$$
-`\htmlId{RL-j-function}{J(\pi_\theta) = \mathbb E_{\tau \sim \mathbb P_{\theta; \mathcal D}} [G(\tau)],\\ \mathbb P_{\theta; \mathcal D} (\tau) = \rho \prod_{t=0}^{T-1} \mathcal D (s_t, a_t, s_{t+1})\ \pi_\theta (a_t\vert s_t).}`
-$$
-
-
+In that, agents seek to learn control strategies (*policies*, $\pi_\theta$) maximizing the expected return $\mathbb E_{\tau \sim \pi_\theta} G(\tau)$. For a given dynamics $\mathcal D$--i.e., for a given problem--taking the expectation over the (possibly random) trajectories resulting from acting according to a certain policy provides a direct, goal-conditioned ordering in the space of all the possible policies $\Pi$, yielding the (maximization) target $J : \Pi \mapsto \mathbb R$
+``` math
+\begin{align}
+    J(\pi_\theta) &= \mathbb E_{\tau \sim \mathbb P_{\theta; \mathcal D}} [G(\tau)],  \\
+    \mathbb P_{\theta; \mathcal D} (\tau) &= \rho \prod_{t=0}^{T-1} \mathcal D (s_t, a_t, s_{t+1})\ \pi_\theta (a_t\vert s_t).
+\end{align}
+```
 
 Because in the RL framework the agent is assumed to only be able to observe the environment dynamics and not to intervene on them, <a href="#RL-j-function" data-reference-type="ref" data-reference="RL-j-function">[RL-j-function]</a> varies exclusively with the policy followed. In turn, MDPs naturally provide a framework to optimize over the space of the possible behaviors an agent might enact ($\pi \in \Pi$), searching for the *optimal policy* $\pi^* = \arg \max_{\theta} J(\pi_\theta)$, where $\theta$ is the parametrization adopted by the policy set $\Pi: \pi_\theta \in \Pi, \ \forall \theta$. Other than providing a target for policy search, $G(\tau)$ can also be used as a target to discriminate between states and state-action pairs. Given any state $s \in \mathcal S$--e.g., a given configuration of the robot--the *state-value* function
+
 ``` math
 V_\pi(s) = \mathbb E_{\tau \sim \pi} [G(\tau) \big \vert s_0 = s]
 ```
@@ -541,13 +556,17 @@ can be used to discriminate between desirable and undesirable state in terms of
 ``` math
 Q_\pi(s,a) = \mathbb E_{\tau \sim \pi} [G (\tau) \big \vert s_0 = s, a_0=a]
 ```
-Crucially, value functions are interrelated: 
 
-$$
-`\htmlId{q-as-v}{Q_\pi(s_t, a_t) = \mathbb{E}_{s_{t+1}\sim \mathbb P(\bullet \vert s_t, a_t)} [r_t + \gamma V_\pi(s_{t+1})]\\ V_\pi(s_t) = \mathbb E_{a_t\sim \pi(\bullet \vert s_t)} [Q_\pi (s_t, a_t)]}`
-$$
+Crucially, value functions are interrelated:
 
- Inducing an ordering over states and state-action pairs under $\pi$, value functions are central to most RL algorithms. A variety of methods have been developed in RL as standalone attemps to find (approximate) solutions to the problem of maximizing cumulative reward (Figure <a href="#rl-algos-atlas" data-reference-type="ref" data-reference="rl-algos-atlas">[rl-algos-atlas]</a>).
+``` math
+\begin{align}
+Q_\pi(s_t, a_t) &= \mathbb{E}_{s_{t+1}\sim \mathbb P(\bullet \vert s_t, a_t)} [r_t + \gamma V_\pi(s_{t+1})]  \\
+V_\pi(s_t) &= \mathbb E_{a_t\sim \pi(\bullet \vert s_t)} [Q_\pi (s_t, a_t)]
+
+\end{align}
+```
+Inducing an ordering over states and state-action pairs under $\pi$, value functions are central to most RL algorithms. A variety of methods have been developed in RL as standalone attemps to find (approximate) solutions to the problem of maximizing cumulative reward (Figure <a href="#rl-algos-atlas" data-reference-type="ref" data-reference="rl-algos-atlas">[rl-algos-atlas]</a>).
 
 <figure>
 <ResponsiveImage
@@ -557,7 +576,7 @@ $$
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="rl-algos-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="rl-algos-atlas" style="position: absolute;"></span>
 <figcaption>Popular RL algorithms. See @SpinningUp2018 for a complete list of citations.</figcaption>
 </figure>
 
@@ -579,7 +598,7 @@ Second, learning with a limited number of samples remains problematic in RL, <sp
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="synthetic-vs-real-duck" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="synthetic-vs-real-duck" style="position: absolute;"></span>
 <figcaption>Simulated (left) vs. real-world (right) OpenDuck. Discrepancies in the simulation dynamics (<em>reality gap</em>) pose risks to policy transfer.</figcaption>
 </figure>
 
@@ -593,7 +612,7 @@ Training RL policies in simulation @tobinDomainRandomizationTransferring2017 ad
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ducks-on-terrains" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ducks-on-terrains" style="position: absolute;"></span>
 <figcaption>The same locomotion task can be carried out in different (simulated) domains (exemplified by the difference in terrains) at training time, resulting to increased robustness over diverse environment dynamics.</figcaption>
 </figure>
 
@@ -628,25 +647,39 @@ Q_{i+1}(s_t, a_t) \leftarrow \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t
 ```
 Then, one can derive the (ideally, near-optimal) policy by explicitly maximizing over the action space the final (ideally, near-optimal) estimate $Q_K \approx Q^*$ at each timestep. In fact, under certain assumptions on the MDP considered, $Q_K \to Q^* \, \text{as } K \to \infty$.
 
-Effective in its early applications to small-scale discrete problems and theoretically sound, vanilla Q-learning was found complicated to scale to large $\mathcal S\times \mathcal A$ problems, in which the storing of $Q : \mathcal S\times \mathcal A\mapsto \mathbb R$ alone might result prohibitive. Also, vanilla Q-learning is not directly usable for *continuous*, unstructured state-action space MPDs, such as those considered in robotics. In their seminal work on *Deep Q-Learning* (DQN), @mnihPlayingAtariDeep2013 propose learning Q-values using deep convolutional neural networks, thereby accomodating for large and even unstructured *state* spaces. DQN parametrizes the Q-function using a neural network with parameters $\theta$, updating the parameters by sequentially minimizing the expected squared temporal-difference error (TD-error, $\delta_i$): 
-
-$$
-`\htmlId{dqn-loss}{\mathcal L(\theta_i) = \mathbb E_{(s_t, a_t) \sim \chi(\bullet)} \big[ (\underbrace{y_i - Q_{\theta_i}(s_t, a_t)}_{\delta_i})^2 \big],\\ y_i = \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t, a_t)} \big[ r_t + \gamma \max_{a_t\in \mathcal A} Q_{\theta_{i-1}} (s_{t+1}, a_{t+1}) \big],}`
-$$
-
- Where $\chi$ represents a behavior distribution over state-action pairs. Crucially, $\chi$ can in principle be different from the policy being followed, effectively allowing to reuse prior data stored in a *replay buffer* in the form of $(s_t, a_t, r_t, s_{t+1})$ transitions, used to form the TD-target $y_i$, TD-error $\delta_i$ and loss function <a href="#dqn-loss" data-reference-type="ref" data-reference="dqn-loss">[dqn-loss]</a> via Monte-Carlo (MC) estimates.
+Effective in its early applications to small-scale discrete problems and theoretically sound, vanilla Q-learning was found complicated to scale to large $\mathcal S\times \mathcal A$ problems, in which the storing of $Q : \mathcal S\times \mathcal A\mapsto \mathbb R$ alone might result prohibitive. Also, vanilla Q-learning is not directly usable for *continuous*, unstructured state-action space MPDs, such as those considered in robotics. In their seminal work on *Deep Q-Learning* (DQN), @mnihPlayingAtariDeep2013 propose learning Q-values using deep convolutional neural networks, thereby accomodating for large and even unstructured *state* spaces. DQN parametrizes the Q-function using a neural network with parameters $\theta$, updating the parameters by sequentially minimizing the expected squared temporal-difference error (TD-error, $\delta_i$):
+``` math
+\begin{align}
+\mathcal L(\theta_i) &= \mathbb E_{(s_t, a_t) \sim \chi(\bullet)} 
+    \big[ 
+        (\underbrace{y_i - Q_{\theta_i}(s_t, a_t)}_{\delta_i})^2 
+    \big],  \\
+    y_i &= \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t, a_t)} \big[ r_t + \gamma \max_{a_t\in \mathcal A} Q_{\theta_{i-1}} (s_{t+1}, a_{t+1}) \big], 
+\end{align}
+```
+Where $\chi$ represents a behavior distribution over state-action pairs. Crucially, $\chi$ can in principle be different from the policy being followed, effectively allowing to reuse prior data stored in a *replay buffer* in the form of $(s_t, a_t, r_t, s_{t+1})$ transitions, used to form the TD-target $y_i$, TD-error $\delta_i$ and loss function <a href="#dqn-loss" data-reference-type="ref" data-reference="dqn-loss">[dqn-loss]</a> via Monte-Carlo (MC) estimates.
 
 While effective in handling large, unstructured state spaces for discrete action-space problems, DQN application’s to continous control problems proved challenging. Indeed, in the case of high-capacity function approximators such as neural networks, solving $\max_{a_t \in \mathcal A} Q_\theta(s_t, a_t)$ at each timestep is simply unfeasible due to the (1) continous nature of the action space ($\mathcal A\subset \mathbb R^n$ for some $n$) and (2) impossibility to express the find a cheap (ideally, closed-form) solution to $Q_\theta$.  @silverDeterministicPolicyGradient2014 tackle this fundamental challenge by using a *deterministic* function of the state $s_t$ as policy, $\mu_\phi(s_t) = a_t$, parametrized by $\phi$. Thus, policies can be iteratively refined updating $\phi$ along the direction:
 ``` math
 \htmlId{deterministic-pg}{d_\phi = \mathbb E_{s_t \sim \mathbb P (\bullet)} [\nabla_\phi Q(s_t, a_t)\vert_{a_t = \mu_\phi(s_t)}] = \mathbb E_{s_t \sim \mathbb P(\bullet)} [\nabla_{a_t} Q(s_t, a_t) \vert_{a_t = \mu_\phi(s_t)} \cdot \nabla_\phi \mu(s_t)]}
 ```
+
 Provably, <a href="#deterministic-pg" data-reference-type="ref" data-reference="deterministic-pg">[deterministic-pg]</a> is the *deterministic policy gradient* (DPG) of the policy $\mu_\phi$ @silverDeterministicPolicyGradient2014, so that updates $\phi_{k+1}\leftarrow \phi_k + \alpha d_\phi$ are guaranteed to increase the (deterministic) cumulative discounted reward, $J(\mu_\phi)$.  @lillicrapContinuousControlDeep2019 extended DPG to the case of (1) high-dimensional unstructured observations and (2) continuous action spaces, introducing Deep Deterministic Policy Gradient (DDPG), an important algorithm RL and its applications to robotics. DDPG adopts a modified TD-target compared to the one defined in <a href="#TD-target" data-reference-type="ref" data-reference="TD-target">[TD-target]</a>, by maintaining a policy network used to select actions, yielding
+
 ``` math
 \htmlId{TD-target-ddpg}{y_i = \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t, a_t)} \big[ r_t + \gamma Q_{\theta_{i-1}} (s_{t+1}, \mu_\phi(s_{t+1})) \big] .}
 ```
 Similarily to DQN, DDPG also employs the same replay buffer mechanism, to reuse past transitions over training for increased sample efficiency and estimate the loss function via MC-estimates.
 
-Soft Actor-Critic (SAC) @haarnojaSoftActorCriticOffPolicy2018 is a derivation of DDPG in the max-entropy (MaxEnt) RL framework, in which RL agents are tasked with <span class="highlight">maximizing the discounted cumulative reward, while acting as randomly as possible</span>. MaxEnt RL @haarnojaReinforcementLearningDeep2017 has proven particularly robust thanks to the development of diverse behaviors, incentivized by its entropy-regularization formulation. In that, MaxEnt revisits the RL objective $J (\pi)$ to specifically account for the policy entropy, $\htmlId{J-soft}{J(\pi) = \sum_{t=0}^T \mathbb{E}_{(s_t, a_t) \sim \chi} [r_t + \alpha \mathcal H(\pi (\bullet \vert s_t))]}$ This modified objective results in the *soft* TD-target:
+Soft Actor-Critic (SAC) @haarnojaSoftActorCriticOffPolicy2018 is a derivation of DDPG in the max-entropy (MaxEnt) RL framework, in which RL agents are tasked with <span class="highlight">maximizing the discounted cumulative reward, while acting as randomly as possible</span>. MaxEnt RL @haarnojaReinforcementLearningDeep2017 has proven particularly robust thanks to the development of diverse behaviors, incentivized by its entropy-regularization formulation. In that, MaxEnt revisits the RL objective $J (\pi)$ to specifically account for the policy entropy,
+``` math
+\begin{align}
+    J(\pi) &= \sum_{t=0}^T \mathbb{E}_{(s_t, a_t) \sim \chi} [r_t + \alpha \mathcal H(\pi (\bullet \vert s_t))] 
+\end{align}
+```
+
+This modified objective results in the *soft* TD-target:
+
 ``` math
 \htmlId{soft-td-target}{y_i = \mathbb E_{s_{t+1} \sim \mathbb P( \bullet \vert s_t, a_t)} [r_t + \gamma \left( Q_{\theta_{i-1}} (s_{t+1}, a_{t+1}) - \alpha \log \pi_\phi(a_{t+1} \vert s_{t+1}) \right)], \quad a_{t+1} \sim \pi_\phi(\bullet \vert s_t)}
 ```
@@ -676,7 +709,7 @@ Lastly, in order to improve on the robustness of their approach to different goa
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="hil-serl-blocks" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="hil-serl-blocks" style="position: absolute;"></span>
 <figcaption>(A) HIL-SERL allows for real-world training of high performance RL agents by building on top advancements presented by of SAC, RLPD and SERL. (B) Example of human intervention during a HIL-SERL training process on a SO-100.</figcaption>
 </figure>
 
@@ -721,7 +754,7 @@ TL;DR Behavioral Cloning provides a natural platform to learn from real-world in
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-bc-trajectories" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-bc-trajectories" style="position: absolute;"></span>
 <figcaption>(A) Average (with standard deviation) evolution of the actuation levels over the first 5 recorded episodes in <a href="lerobot/svla_so101_pickplace" class="uri">lerobot/svla_so101_pickplace</a>. Proprioperceptive state provide invaluable to determine the robot’s state during an episode. (B) Camera frames are also recorded alongside measurements on the robot’s state, capturing information about the robot’s interaction with its environment.</figcaption>
 </figure>
 
@@ -737,7 +770,7 @@ Formally, let $\mathcal D = \{ \tau^{(i)} \}_{i=1}^N$ be a set of expert traject
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-observation-action-mapping" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-observation-action-mapping" style="position: absolute;"></span>
 <figcaption>Sample observations and action pairs over the course of a given trajectory recorded in <a href="lerobot/svla_so101_pickplace" class="uri">lerobot/svla_so101_pickplace</a>. Observations, comprising of both proprioperceptive and visual information, are recorded alongside the configuration of a second, leader robot controlled by a human expert, providing complete information for regressing actions given observation.</figcaption>
 </figure>
 
@@ -759,7 +792,7 @@ Despite the inherent challenges of learning on non-i.i.d. data, the BC formulati
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-issues-with-bc" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-issues-with-bc" style="position: absolute;"></span>
 <figcaption>Point-wise policies suffer from limitations due to (A) covariate shifts and poor approximation of (B) multimodal demonstrations. (A) Initially small errors may drive the policy out of distribution, incuring in a vicious circle ultimately resulting in failure. (B) Both modes of reaching for a target object in a scene, either left or right-first, are equally as good and thus equally as likely to be present in a dataset of human demonstrations, ultimately resulting in multimodal demonstrations.</figcaption>
 </figure>
 
@@ -779,7 +812,7 @@ Generative Models (GMs) aim to learn the stochastic process underlying the very
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-task-effect-on-pairs" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-task-effect-on-pairs" style="position: absolute;"></span>
 <figcaption>Intuitively, latent variable in a single latent model may contain information regarding the task being performed, which directly results in the likelihood of the same observation-action pair being different for two different tasks. When (A) picking a block the likelihood of a wide gripper’s opening should be higher than narrower one, while it should be the opposite when (B) pushing the block.</figcaption>
 </figure>
 
@@ -797,41 +830,64 @@ Intuitively, in the case of observation-action pairs $(o, a)$ for a robotics app
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-latent-variable-model" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-latent-variable-model" style="position: absolute;"></span>
 <figcaption>(A) The latent variable model in a robotics application regulates influence between observed (<span class="math inline"> <em>o</em>, <em>a</em>)</span> variables and an unobservable latent variable. (B) VAEs approximate exact latent variable models by means of variational inference.</figcaption>
 </figure>
 
-Given a dataset $\mathcal D$ consisting of $N$ i.i.d. observation-action pairs, the log-likelihood of all datapoints under $\theta$ (in Bayesian terms, the *evidence* $p_\theta(\mathcal D)$) can thus be written as: 
-
-$$
-`\htmlId{evidence-definition-1}{\log p_\theta(\mathcal D) = \log \sum_{i=0}^N p_\theta ((o,a)_i)\\ = \log \sum_{i=0}^N \int_{\text{supp}({Z})} p_\theta((o,a)_i \vert z) p(z)\\ = \log \sum_{i=0}^N \int_{\text{supp}({Z})} \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z) p(z)\\ = \log \sum_{i=0}^N \mathbb E_{z \sim p_\theta(\bullet \vert (o,a)_i)} [\frac{p(z)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z)],}`
-$$
-
- where we used <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a> in <a href="#evidence-definition-1" data-reference-type="ref" data-reference="evidence-definition-1">[evidence-definition-1]</a>, multiplied by $1 = \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)}$ in <a href="#evidence-definition-2" data-reference-type="ref" data-reference="evidence-definition-2">[evidence-definition-2]</a>, and used the definition of expected value in <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a>.
+Given a dataset $\mathcal D$ consisting of $N$ i.i.d. observation-action pairs, the log-likelihood of all datapoints under $\theta$ (in Bayesian terms, the *evidence* $p_\theta(\mathcal D)$) can thus be written as:
+``` math
+\begin{align}
+    \log p_\theta(\mathcal D) &= \log \sum_{i=0}^N p_\theta ((o,a)_i) \\
+                              &= \log \sum_{i=0}^N \int_{\text{supp}({Z})} p_\theta((o,a)_i \vert z) p(z) \\
+                              &= \log \sum_{i=0}^N \int_{\text{supp}({Z})} \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z) p(z) \\
+                              &= \log \sum_{i=0}^N \mathbb E_{z \sim p_\theta(\bullet \vert (o,a)_i)} [\frac{p(z)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z)], 
+\end{align}
+```
+where we used <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a> in <a href="#evidence-definition-1" data-reference-type="ref" data-reference="evidence-definition-1">[evidence-definition-1]</a>, multiplied by $1 = \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)}$ in <a href="#evidence-definition-2" data-reference-type="ref" data-reference="evidence-definition-2">[evidence-definition-2]</a>, and used the definition of expected value in <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a>.
 
 In the special case where one assumes distributions to be tractable, $p_\theta (\mathcal D)$ is typically tractable too, and $\max_\theta \log p_\theta(\mathcal D)$ provides a natural target for (point-wise) infering the unknown parameters $\theta$ of the generative model. Unfortunately, <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> is rarely tractable when the distribution $p$ is modeled with approximators such as neural networks, especially for high-dimensional, unstructured data.
 
 In their seminal work on Variational Auto-Encoders (VAEs), @kingmaAutoEncodingVariationalBayes2022 present two major contributions to learn complex latent-variable GMs on unstructured data, proposing (1) a tractable, variational lower-bound to <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> as an optimization target to jointly learn likelihood and posterior and (2) high-capacity function approximators to model the likelihood $p_\theta(o,a\vert z)$ and (approximate) posterior distribution $q_\phi(z \vert o,a) \approx q_\theta(z \vert o,a)$.
 
-In particular, the lower bound on <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> (Evidence LOwer Bound, *ELBO*) can be derived from <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> applying Jensen’s inequality--$\log \mathbb{E}[\bullet] \geq \mathbb{E} [\log (\bullet)]$--yielding: 
+In particular, the lower bound on <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> (Evidence LOwer Bound, *ELBO*) can be derived from <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> applying Jensen’s inequality--$\log \mathbb{E}[\bullet] \geq \mathbb{E} [\log (\bullet)]$--yielding:
+``` math
+\begin{align}
+    \log p_\theta(\mathcal D) &\geq \sum_{i=0}^{N} \left(
+            \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big]
+            + \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} [\log \left( \frac{p(z)}{q_\theta(z \vert (o,a)_i)} \right)]
+        \right) \\
+        &= \sum_{i=0}^{N} \left(
+            \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big]
+        - \text{D}_{\text{KL}}\big[ q_\theta(z \vert (o,a)_i) \Vert p(z) \big]
+        \right) 
+\end{align}
+```
 
-$$
-`\htmlId{ELBO-intractable}{\log p_\theta(\mathcal D) \geq \sum_{i=0}^{N} \left( \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big] + \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} [\log \left( \frac{p(z)}{q_\theta(z \vert (o,a)_i)} \right)] \right)\\ = \sum_{i=0}^{N} \left( \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big] - \text{D}_{\text{KL}}\big[ q_\theta(z \vert (o,a)_i) \Vert p(z) \big] \right)}`
-$$
+The true, generally intractable posterior $p_\theta (z \vert o,a)$ prevents computing both the expectation and KL divergence terms in <a href="#ELBO-intractable" data-reference-type="ref" data-reference="ELBO-intractable">[ELBO-intractable]</a>, and therefore @kingmaAutoEncodingVariationalBayes2022 propose deriving the ELBO using an *approximate* posterior $q_\phi(z \vert o,a)$, resulting in the final, tractable ELBO objective,
 
- The true, generally intractable posterior $p_\theta (z \vert o,a)$ prevents computing both the expectation and KL divergence terms in <a href="#ELBO-intractable" data-reference-type="ref" data-reference="ELBO-intractable">[ELBO-intractable]</a>, and therefore @kingmaAutoEncodingVariationalBayes2022 propose deriving the ELBO using an *approximate* posterior $q_\phi(z \vert o,a)$, resulting in the final, tractable ELBO objective, $\htmlId{ELBO}{\text{ELBO}_{\mathcal D}(\theta, \phi) = \sum_{i=0}^{N} \left( \mathbb{E}_{z \sim q_\phi(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big] - \text{D}_{\text{KL}}\big[ q_\phi(z \vert (o,a)_i) \Vert p(z) \big] \right)}$ From Jensen’s inequality, maximizing ELBO results in maximizing the log-likelihood of the data too, thus providing a natural, tractable optimization target. Indeed, expectations can be estimated using MC estimates from the learned distributions in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, while the KL-divergence term can typically be computed in closed-form (1) modeling $q_\phi$ as a Gaussian $q_\phi(z \vert o,a) = \mathcal N\big(\mu_\phi(o,a), \Sigma_\phi(o,a) \big)$ and (2) imposing a standard Gaussian prior on the latent space, $p(z) = \mathcal N(\mathbf{0}, \mathbf{I})$.
+``` math
+\begin{align}
+\text{ELBO}_{\mathcal D}(\theta, \phi) = \sum_{i=0}^{N} \left(
+            \mathbb{E}_{z \sim q_\phi(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big]
+        - \text{D}_{\text{KL}}\big[ q_\phi(z \vert (o,a)_i) \Vert p(z) \big]
+        \right)
+        
+\end{align}
+```
+From Jensen’s inequality, maximizing ELBO results in maximizing the log-likelihood of the data too, thus providing a natural, tractable optimization target. Indeed, expectations can be estimated using MC estimates from the learned distributions in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, while the KL-divergence term can typically be computed in closed-form (1) modeling $q_\phi$ as a Gaussian $q_\phi(z \vert o,a) = \mathcal N\big(\mu_\phi(o,a), \Sigma_\phi(o,a) \big)$ and (2) imposing a standard Gaussian prior on the latent space, $p(z) = \mathcal N(\mathbf{0}, \mathbf{I})$.
 
 An intuitive explanation of the learning dynamics of VAEs can be given considering the equivalent case of *minimizing the negative ELBO*, which admits a particularly interpretable factorization
 
-
-
-$$
-`\htmlId{VAE-min-neg-ELBO}{\min_{\theta, \phi} - \text{ELBO}_{\mathcal (o,a) \sim \mathcal D}(\theta, \phi) = \min_{\theta, \phi}\mathbf{L^{\text{rec}}}(\theta) + \mathbf{L^{\text{reg}}}(\phi)\\ \mathbf{L^{\text{rec}}}(\theta) = \mathbb{E}_{z \sim q_\phi(\cdot \vert o,a} \big[ \log p_\theta(o,a \vert z) \big]\\ \mathbf{L^{\text{reg}}}(\phi) = \text{D}_{\text{KL}}\big[ q_\phi(z \vert o,a) \Vert p(z) \big]}`
-$$
-
-
+``` math
+\begin{align}
+\min_{\theta, \phi} - \text{ELBO}_{\mathcal (o,a) \sim \mathcal D}(\theta, \phi) &= \min_{\theta, \phi}\mathbf{L^{\text{rec}}}(\theta) + \mathbf{L^{\text{reg}}}(\phi) \\
+\mathbf{L^{\text{rec}}}(\theta) &= \mathbb{E}_{z \sim q_\phi(\cdot \vert o,a} \big[ \log p_\theta(o,a \vert z) \big]  \\
+\mathbf{L^{\text{reg}}}(\phi) &= \text{D}_{\text{KL}}\big[ q_\phi(z \vert o,a) \Vert p(z) \big] 
+\end{align}
+```
 
 For any given $(o,a)$ pair, the expected value term of <a href="#VAE-Lrec" data-reference-type="ref" data-reference="VAE-Lrec">[VAE-Lrec]</a> is typically computed via MC estimates, resulting in
+
 ``` math
 -\mathbb{E}_{z \sim q_\phi(\bullet \vert o,a)} \big[ \log p_\theta(o,a \vert z) \big] = \mathbf{L^{\text{rec}}} \approx - \frac{1}{n} \sum_{i=0}^n \log p_\theta(o,a \vert z_i).
 ```
@@ -843,13 +899,14 @@ Indeed, it is very common in practice to approximate from the learned likelihood
 
 #### Diffusion Models
 
-VAEs approximate probability distributions via a *single* latent variable model, assuming the underlying unknown distribution can be factored according to <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a>, and solve the variational inference problem of jointly learning the likelihood $p_\theta$ and (approximate) posterior $q_\phi$ for such model. In that, the unknown data distribution $p(o,a)$ is effectively approximated via $\int_Z p(z) p_\theta(o,a \vert z)$, and the underlying generative process reproduced by (1) sampling a latent variable and (2) learning to decode it into a (ideally) high-likelihood sample under the (unknown) $p(o,a)$. Diffusion Models (DMs) @hoDenoisingDiffusionProbabilistic2020 are another class of GMs which treat the similar problem of approximating an underlying unknown data distribution--*variational inference*--by *partially* extending VAEs to the case where *multiple* latent variables influence each other and the generative process underlying $o,a$ itself. In particular, DMs posit the generative process can be decomposed to a series of piece-wise (Markovian) interactions between (latent) variables (Figure <a href="#ch4-many-latents" data-reference-type="ref" data-reference="ch4-many-latents">[ch4-many-latents]</a>), resulting in 
-
-$$
-`\htmlId{BC-multi-latent-model-1}{p(\underbrace{o,a}_{= z_0}) = \int_{\text{supp}({Z_0})} \int_{\text{supp}({Z_1})} \ldots \int_{\text{supp}({Z_T})} p(z_0, z_1, \dots z_T)\\ p(z_0, z_1, \dots z_T) = p(z_T) \prod_{t=0}^{T} p(z_{t-1} \vert z_t),}`
-$$
-
- where we explicitly showed the marginalization over the multiple latents in <a href="#BC-multi-latent-model-1" data-reference-type="ref" data-reference="BC-multi-latent-model-1">[BC-multi-latent-model-1]</a>, and used the law of conditional probability and Markov property in <a href="#BC-multi-latent-model-2" data-reference-type="ref" data-reference="BC-multi-latent-model-2">[BC-multi-latent-model-2]</a>.
+VAEs approximate probability distributions via a *single* latent variable model, assuming the underlying unknown distribution can be factored according to <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a>, and solve the variational inference problem of jointly learning the likelihood $p_\theta$ and (approximate) posterior $q_\phi$ for such model. In that, the unknown data distribution $p(o,a)$ is effectively approximated via $\int_Z p(z) p_\theta(o,a \vert z)$, and the underlying generative process reproduced by (1) sampling a latent variable and (2) learning to decode it into a (ideally) high-likelihood sample under the (unknown) $p(o,a)$. Diffusion Models (DMs) @hoDenoisingDiffusionProbabilistic2020 are another class of GMs which treat the similar problem of approximating an underlying unknown data distribution--*variational inference*--by *partially* extending VAEs to the case where *multiple* latent variables influence each other and the generative process underlying $o,a$ itself. In particular, DMs posit the generative process can be decomposed to a series of piece-wise (Markovian) interactions between (latent) variables (Figure <a href="#ch4-many-latents" data-reference-type="ref" data-reference="ch4-many-latents">[ch4-many-latents]</a>), resulting in
+``` math
+\begin{align}
+    p(\underbrace{o,a}_{= z_0}) &= \int_{\text{supp}({Z_0})} \int_{\text{supp}({Z_1})} \ldots \int_{\text{supp}({Z_T})} p(z_0, z_1, \dots z_T)  \\ 
+    p(z_0, z_1, \dots z_T) &= p(z_T) \prod_{t=0}^{T} p(z_{t-1} \vert z_t), 
+\end{align}
+```
+where we explicitly showed the marginalization over the multiple latents in <a href="#BC-multi-latent-model-1" data-reference-type="ref" data-reference="BC-multi-latent-model-1">[BC-multi-latent-model-1]</a>, and used the law of conditional probability and Markov property in <a href="#BC-multi-latent-model-2" data-reference-type="ref" data-reference="BC-multi-latent-model-2">[BC-multi-latent-model-2]</a>.
 
 <figure>
 <ResponsiveImage
@@ -859,7 +916,7 @@ $$
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-many-latents" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-many-latents" style="position: absolute;"></span>
 <figcaption>HMLV models posit the data generation process is influenced by a stack of Markov-dependent latent variables, with samples from the posterior distribution being progressively higher up in the hierarchy.</figcaption>
 </figure>
 
@@ -867,13 +924,16 @@ Similarily to VAEs, providing an exact interpretation for the latent variables i
 
 Just like VAEs, DMs attemp to learn to reproduce an underlying data distribution $p (o,a)$ given a collection of i.i.d. samples approximating the model posited to have generated the data in the first place ( <a href="#BC-multi-latent-model-1" data-reference-type="ref" data-reference="BC-multi-latent-model-1">[BC-multi-latent-model-1]</a>). Similarily to VAEs, DMs approximate the process of sampling from the unknown $p(o,a)$ (1) sampling from an easy-to-sample distribution (e.g., Gaussian) and (2) learning to reconstruct high-likelihood samples under the unknown distribution. However, in stark contrast with VAEs, the easy-to-sample distribution contains *no mutual information* regarding the data distribution $p(o,a)$. Crucially, as no information from the sample $(o,a)$ (denoted as $z_0 \equiv (o,a)$ for the sake of notation) is assumed to be propagated throughout the chain of latents, the posterior $q(z_t \vert z_{t-1})$ assumes a relatively amicable structure in DMs, reducing complexity. The *true* likelihood $p(z_{t-1} \vert z_t)$ is instead typically approximated using the parametrization $p_\theta (z_{t-1} \vert z_t)$. In that, the information contained in the unknwon data distribution is *reconstructed* via a process in which samples from a fixed distribution are turned into (ideally) high-likelihood samples under $p(o,a)$--a process referred to as *denoising*.
 
-Under such model, we can express the log-likelihood of an arbitrary sample as[^4] 
-
-$$
-`\htmlId{diffusion-likelihood}{\log p_\theta (\underbrace{o,a}_{= z_0}) = \mathbb{E}_{z_1 \sim q(\bullet \vert z_0)} \log p_\theta (z_0 \vert z_1) -\\ \mathbb{E}_{z_{T-1} \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_T \vert z_{T-1}) \Vert p(z_T) ) \big] - \notag\\ \sum_{t=1}^{T-1} \mathbb{E}_{(z_{t-1}, z_{t+1}) \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_t \vert z_{t-1}) \Vert p_\theta(z_t \vert z_{t-1}) ) \big], \notag}`
-$$
-
- providing an optimization target in the form of $\max_\theta \log p_\theta (\mathcal D)$.
+Under such model, we can express the log-likelihood of an arbitrary sample as[^4]
+``` math
+\begin{align}
+    \log p_\theta (\underbrace{o,a}_{= z_0}) = 
+    &\mathbb{E}_{z_1 \sim q(\bullet \vert z_0)} \log p_\theta (z_0 \vert z_1) -  \\
+    &\mathbb{E}_{z_{T-1} \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_T \vert z_{T-1}) \Vert p(z_T) ) \big] - \notag \\ 
+    &\sum_{t=1}^{T-1} \mathbb{E}_{(z_{t-1}, z_{t+1}) \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_t \vert z_{t-1}) \Vert p_\theta(z_t \vert z_{t-1}) ) \big], \notag
+\end{align}
+```
+providing an optimization target in the form of $\max_\theta \log p_\theta (\mathcal D)$.
 
 In their seminal work on using DMs for variational inference, @hoDenoisingDiffusionProbabilistic2020 introduce major contributions regarding solving $\min_\theta -\log p_\theta(o,a)$. In particular, @hoDenoisingDiffusionProbabilistic2020 exclusively adopt a fixed *Gaussian* posterior in the form of $q(z_t \vert z_{t-1}) = \mathcal{N}(\sqrt{1-\beta_t}z_{t-1}, \beta_t \mathbf I)$. The choice of adopting Gaussians has profound implications on the generative process modeled. Indeed, under the (mild) assumption that the variance is sufficiently small $\beta_t \leq \eta, \eta \in \mathbb R^+$, @sohl-dicksteinDeepUnsupervisedLearning2015 proved that the likelihood $p(z_{t-1} \vert z_t)$ is Gaussian as well, which allows for the particularly convenient parametrization of the approximate likelihood $p_\theta (x_{t-1} \vert x_t) = \mathcal N(\mu_\theta(x_t, t), \Sigma_\theta(x_t,t)), \ t \in [1,T]$, as well as for closed-form tractability of the KL-divergence terms in <a href="#diffusion-likelihood" data-reference-type="ref" data-reference="diffusion-likelihood">[diffusion-likelihood]</a>. Further, the posterior’s structure also enables an analytical description for the distribution of the $t$-th latent variable, $q(z_t \vert z_0) = \mathcal N (\sqrt{\bar{\alpha}_t}z_0, (1-\bar{\alpha}_t) \mathbf{I})$, with $\alpha_t = 1-\beta_t, \ \bar \alpha_t = \prod_{k=1}^t \alpha_k$, which conveniently prevents iterative posterior sampling.
 
@@ -885,7 +945,7 @@ In their seminal work on using DMs for variational inference, @hoDenoisingDiffu
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="diffusion-robot-actions" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="diffusion-robot-actions" style="position: absolute;"></span>
 <figcaption>DMs iteratively corrupt samples (left) from an unknown distribution into a quasi-standard Gaussian (center), learning the displacement field (right) that permits to reconstruct samples from the unknown target distribution by iteratively denoising samples of a tractable, easy-to-sample distribution.</figcaption>
 </figure>
 
@@ -899,29 +959,45 @@ Finally, adopting Gaussian posteriors permits a particularly pleasing interpreta
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-action-vs-observation-distribution" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-action-vs-observation-distribution" style="position: absolute;"></span>
 <figcaption>A joint action-observation distribution, in the simplified case where the observation is the elbow-flex actuation in a SO-100, and the action is the recorded position for the same joint in the teleoperator arm. The motion recorded being teleoperated, the points distribute along a the diagonal.</figcaption>
 </figure>
 
-Because the recorded behavior is teleoperated, measurements mostly distribute along the line $a = o + \eta, \eta \sim N(0,1)$, with $\eta$-variability accouting for minor control inconsistencies (Figure <a href="#ch4-action-vs-observation-distribution" data-reference-type="ref" data-reference="ch4-action-vs-observation-distribution">[ch4-action-vs-observation-distribution]</a>). Using Gaussian posteriors--i.e., adding Gaussian noise--effectively simulates a *Brownian motion* for the elements in the distribution’s support (in Figure <a href="#diffusion-robot-actions" data-reference-type="ref" data-reference="diffusion-robot-actions">[diffusion-robot-actions]</a>, $\mathcal O\times \mathcal A$), whereby information *diffuses away* from the samples, and comparing the diffused samples to the original data points one can derive an estimate of the total displacement induced by diffusion. Under the only assumption that the likelihood of the diffused samples is low under the original unknown data distribution, then one can effectively approximate the unkwown distribution by learning to *reverse* such displacement. This key intuition allows to write a simplified training objective: $\htmlId{diffusion-simplified-loss}{\mathcal L(\theta) = \mathbb{E}_{t, z_0, \epsilon} \big[ \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} z_0 + \epsilon \sqrt{1 - \bar \alpha_t}, t) \Vert^2 \big], \quad t \sim \mathcal{U}(\{1,\dots,T\}), \quad z_0 \sim \mathcal{D}, \quad \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}).}$
+Because the recorded behavior is teleoperated, measurements mostly distribute along the line $a = o + \eta, \eta \sim N(0,1)$, with $\eta$-variability accouting for minor control inconsistencies (Figure <a href="#ch4-action-vs-observation-distribution" data-reference-type="ref" data-reference="ch4-action-vs-observation-distribution">[ch4-action-vs-observation-distribution]</a>). Using Gaussian posteriors--i.e., adding Gaussian noise--effectively simulates a *Brownian motion* for the elements in the distribution’s support (in Figure <a href="#diffusion-robot-actions" data-reference-type="ref" data-reference="diffusion-robot-actions">[diffusion-robot-actions]</a>, $\mathcal O\times \mathcal A$), whereby information *diffuses away* from the samples, and comparing the diffused samples to the original data points one can derive an estimate of the total displacement induced by diffusion. Under the only assumption that the likelihood of the diffused samples is low under the original unknown data distribution, then one can effectively approximate the unkwown distribution by learning to *reverse* such displacement. This key intuition allows to write a simplified training objective:
+``` math
+\begin{align}
+
+    \mathcal L(\theta) = \mathbb{E}_{t, z_0, \epsilon} \big[
+        \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} z_0 + \epsilon \sqrt{1 - \bar \alpha_t}, t) \Vert^2 \big], \quad t \sim \mathcal{U}(\{1,\dots,T\}), \quad
+        z_0 \sim \mathcal{D}, \quad
+        \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}).
+\end{align}
+```
 
 In this simplified (minimization) objective, the optimization process differs from <a href="#diffusion-likelihood" data-reference-type="ref" data-reference="diffusion-likelihood">[diffusion-likelihood]</a> in that, rather than maxizing $p_\theta$ directly, the parameters $\theta$ of the pairwise likelihood $p_\theta(z_{t-1} \vert z_t)$ are adjusted to *predict the total displacement* $\epsilon$ for a randomly long ($t \sim \mathcal{U}(\{1,\dots,T\}$ )) diffusion process starting from a sample of the target distribution.
 
-By learning the total displacement from a generally, uninformative corrupted sample obtained diffusing information and a sample from an unknown distribution--significant ($\Vert \epsilon \Vert > 0$) whenever input and target distribution are sufficiently different-- @hoDenoisingDiffusionProbabilistic2020 show that one can approximate the underlying distribution reversing the displacement, *denoising* samples. Interestingly, under the hypothesis real-world data belongs to a single higher dimensional manifold (Manifold Hypothesis), @permenterInterpretingImprovingDiffusion2024 show that diffusion learns the gradient of a distance function from any off-point manifold (such as perturbed, uniformative samples), and the data manifold itself. Following this gradient--i.e., denoising a sample from an uninformative distribution--corresponds to projecting back into the manifold, yielding a procedure to sample from unknown distributions by means of Euclidean projection. Indeed, under the assumption that $p_\theta (z_{t-1} \vert z_t)$ is Gaussian, then sampling $z_{t-1} \sim p_\theta(\bullet \vert z_{t})$ corresponds to computing $\htmlId{diffusion-denoising-definition}{z_{t-1} = \frac{1}{\sqrt{\alpha_t}} \left( z_t - \frac{\beta_t}{\sqrt{1 - \bar\alpha_t}} \epsilon_\theta(z_t, t) \right) + \sigma_t \epsilon, \quad \epsilon \sim \mathcal N(\mathbf{0}, \mathbf{I}),}$ thus showing that the lower-level latent variables in a DM can be obtained by iteratively removing noise from the one-step higher order variable, using the noise regressor $\epsilon_\theta(z_t, t)$ learned minimizing <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>.
+By learning the total displacement from a generally, uninformative corrupted sample obtained diffusing information and a sample from an unknown distribution--significant ($\Vert \epsilon \Vert > 0$) whenever input and target distribution are sufficiently different-- @hoDenoisingDiffusionProbabilistic2020 show that one can approximate the underlying distribution reversing the displacement, *denoising* samples. Interestingly, under the hypothesis real-world data belongs to a single higher dimensional manifold (Manifold Hypothesis), @permenterInterpretingImprovingDiffusion2024 show that diffusion learns the gradient of a distance function from any off-point manifold (such as perturbed, uniformative samples), and the data manifold itself. Following this gradient--i.e., denoising a sample from an uninformative distribution--corresponds to projecting back into the manifold, yielding a procedure to sample from unknown distributions by means of Euclidean projection. Indeed, under the assumption that $p_\theta (z_{t-1} \vert z_t)$ is Gaussian, then sampling $z_{t-1} \sim p_\theta(\bullet \vert z_{t})$ corresponds to computing
+``` math
+\begin{align}
+    z_{t-1} = \frac{1}{\sqrt{\alpha_t}} \left( z_t - \frac{\beta_t}{\sqrt{1 - \bar\alpha_t}} \epsilon_\theta(z_t, t) \right) + \sigma_t \epsilon, \quad \epsilon \sim \mathcal N(\mathbf{0}, \mathbf{I}), 
+\end{align}
+```
+thus showing that the lower-level latent variables in a DM can be obtained by iteratively removing noise from the one-step higher order variable, using the noise regressor $\epsilon_\theta(z_t, t)$ learned minimizing <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>.
 
 #### Flow Matching
 
 <span id="ch4-flow-matching" style="position: absolute;"></span>
 
-The posterior parametrization adopted by DMs proved traditionally effective, yet it raised concerns circa its efficiency at inference time, where a possibly large of compute-expensive denoising steps are needed in order to recover a sample from the target distribution. Flow Matching (FM) @lipmanFlowMatchingGenerative2023 extends DMs to the general case of arbitrary, parametrized likelihood and posteriors, and in this defines a superseding class of GMs providing a unified framework for learning *continuous transformations* between distributions, encompassing and generalizing DMs. Instead of a *stochastic, discrete, multi-step* denoising process, FM aims to learn a *deterministic, continuous, differentiable flow* $\psi [0,1] \times Z \mapsto Z$, formalized starting from possibly time-dependent vector field $v: [0,1] \times Z \mapsto Z$ transporting samples from a simple prior distribution $p_0$--e.g., a standard Gaussian--to a more complex, potentially unknown data distribution $p_1$ over time. Note how FM models time $t \in [0,1]$ to be varying continuously while moving away *from* an easy-to-sample distribution $p_0$ *towards* the unknown data-distribution, $p_1$. This results in a continuous and deterministic trajectory for each sample, which can be more efficient to generate compared to the stochastic paths of DMs. Formally, FM can be fully characterized by an ordinary differential equation (ODE) relating instantaneous variations of flows with the underlying vector field, and hence providing complete trajectories over the distributions’ support when integrating over time, 
-
-$$
-`\frac{d}{dt} \psi(z, t) = v(t, \psi(t, z))\\ \psi(0, z) = z`
-$$
-
-
+The posterior parametrization adopted by DMs proved traditionally effective, yet it raised concerns circa its efficiency at inference time, where a possibly large of compute-expensive denoising steps are needed in order to recover a sample from the target distribution. Flow Matching (FM) @lipmanFlowMatchingGenerative2023 extends DMs to the general case of arbitrary, parametrized likelihood and posteriors, and in this defines a superseding class of GMs providing a unified framework for learning *continuous transformations* between distributions, encompassing and generalizing DMs. Instead of a *stochastic, discrete, multi-step* denoising process, FM aims to learn a *deterministic, continuous, differentiable flow* $\psi [0,1] \times Z \mapsto Z$, formalized starting from possibly time-dependent vector field $v: [0,1] \times Z \mapsto Z$ transporting samples from a simple prior distribution $p_0$--e.g., a standard Gaussian--to a more complex, potentially unknown data distribution $p_1$ over time. Note how FM models time $t \in [0,1]$ to be varying continuously while moving away *from* an easy-to-sample distribution $p_0$ *towards* the unknown data-distribution, $p_1$. This results in a continuous and deterministic trajectory for each sample, which can be more efficient to generate compared to the stochastic paths of DMs. Formally, FM can be fully characterized by an ordinary differential equation (ODE) relating instantaneous variations of flows with the underlying vector field, and hence providing complete trajectories over the distributions’ support when integrating over time,
+``` math
+\begin{align}
+    \frac{d}{dt} \psi(z, t) &= v(t, \psi(t, z)) \\
+    \psi(0, z) &= z
+\end{align}
+```
 
 FM proved very effective in a variety of applications, ranging from image @esserScalingRectifiedFlow2024 and video generation @polyakMovieGenCast2025 to robotics control @blackp0VisionLanguageActionFlow2024. Most notably, in their introductory work on FM for GM, @lipmanFlowMatchingGenerative2023 show how DMs can be seen as a specific instance of FM where the *conditional* target vector field $u$ approximated by the noise regressor corresponds to
+
 ``` math
 \htmlId{fm-diffusion-vector-field}{u(t, z\vert z_0) = \frac{\frac{d}{dt}\alpha(1-t)}{1 - (\alpha(1-t))^2}(\alpha(1-t)z - z_0), \quad \alpha(t) = e^{-\frac12 \int_0^t \beta(s) ds}, \quad \forall z_0 \in \mathcal D}
 ```
@@ -935,7 +1011,7 @@ Note that the traditional discrete-time noise-scheduler ${\beta_t}_{t=0}^T$ is n
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-normalizing-flows" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-normalizing-flows" style="position: absolute;"></span>
 <figcaption>Probability distributions can be modified applying vector fields resulting in a flow of mass in the support. When acting over time, vector fields can effectively change the distribution’s structure.</figcaption>
 </figure>
 
@@ -949,11 +1025,19 @@ While the noising schedule of DMs results in a stochastic process that resembles
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-diffusion-paths-versus-fm" style="position- absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-diffusion-paths-versus-fm" style="position: absolute;"></span>
 <figcaption>Compared to diffusion, flow matching distorts distribution along a less randomic pattern, resulting in a clearer interpolation between source and target distribution. The visualization shows an example comparison between these two methods on joint distribution of robot observations and actions over <span class="math inline"> <em>T</em> = 50</span> steps.</figcaption>
 </figure>
 
-In practice, FM can be applied to generative modeling by learning a vector field regressor $v_\theta(z, t)$ to approximate a given target vector field $u(t, z)$. In the particular case of DMs, $u(t, z)$ is defined as in <a href="#fm-diffusion-vector-field" data-reference-type="ref" data-reference="fm-diffusion-vector-field">[fm-diffusion-vector-field]</a>, while in priciple the target vector field can be learned to induce a particular transportation, or fixed according to OT. Given a sample from the data distribution $z_1 \sim p_1$ and a sample from an easy-to-sample prior $z_0 \sim p_0$, CFM defines a simple path between them using *linear interpolation* between samples $z_t = (1-t)z_0 + t z_1$, resulting in the target vector field $u(t, z_t) = z_1 - z_0$. Then, a FM model can be trained with the simple regression objective defined as $\htmlId{flow-matching-objective}{\mathcal L(\theta) = \mathbb{E}_{t, z_0, z_1} \big[ \Vert v_\theta((1-t)z_0 + t z_1, t) - (z_1 - z_0) \Vert^2 \big], \quad t \sim \mathcal{U}([0,1]),}$ where $z_0 \sim p_0(\bullet)$ and $z_1 \sim p_1(\bullet)$. Note how in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a>--differently from <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>--time is assumed to be varying continuously $t \sim \mathcal U([0,1])$ rather than discretely $t \sim \mathcal U(\{0,1\})$, a key property of flow-based models. The objective in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a> directly regresses the learned vector field onto the simple, straight path connecting a point from the prior and a point from the data, providing a simulation-free training procedure that is both stable and efficient. At inference time, samples are generated by starting with $z_0 \sim p_0$ and iteratively refined according to $\frac{dz}{dt} = v_\theta(z_t, t)$ for $t \in [0,1]$--an operation that can be numerically carried out with standard ODE solvers.
+In practice, FM can be applied to generative modeling by learning a vector field regressor $v_\theta(z, t)$ to approximate a given target vector field $u(t, z)$. In the particular case of DMs, $u(t, z)$ is defined as in <a href="#fm-diffusion-vector-field" data-reference-type="ref" data-reference="fm-diffusion-vector-field">[fm-diffusion-vector-field]</a>, while in priciple the target vector field can be learned to induce a particular transportation, or fixed according to OT. Given a sample from the data distribution $z_1 \sim p_1$ and a sample from an easy-to-sample prior $z_0 \sim p_0$, CFM defines a simple path between them using *linear interpolation* between samples $z_t = (1-t)z_0 + t z_1$, resulting in the target vector field $u(t, z_t) = z_1 - z_0$. Then, a FM model can be trained with the simple regression objective defined as
+``` math
+\begin{align}
+
+    \mathcal L(\theta) = \mathbb{E}_{t, z_0, z_1} \big[
+        \Vert v_\theta((1-t)z_0 + t z_1, t) - (z_1 - z_0) \Vert^2 \big], \quad t \sim \mathcal{U}([0,1]),
+\end{align}
+```
+where $z_0 \sim p_0(\bullet)$ and $z_1 \sim p_1(\bullet)$. Note how in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a>--differently from <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>--time is assumed to be varying continuously $t \sim \mathcal U([0,1])$ rather than discretely $t \sim \mathcal U(\{0,1\})$, a key property of flow-based models. The objective in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a> directly regresses the learned vector field onto the simple, straight path connecting a point from the prior and a point from the data, providing a simulation-free training procedure that is both stable and efficient. At inference time, samples are generated by starting with $z_0 \sim p_0$ and iteratively refined according to $\frac{dz}{dt} = v_\theta(z_t, t)$ for $t \in [0,1]$--an operation that can be numerically carried out with standard ODE solvers.
 
 ### Action Chunking with Transformers
 
@@ -961,7 +1045,17 @@ While GMs prove useful in learning complex, high-dimensional multi-modal distrib
 
 On the robot learning side of their contributions, @zhaoLearningFineGrainedBimanual2023 adopt transformers as the architectural backbone to learn a *Conditional* VAE @sohnLearningStructuredOutput2015. Conditional VAEs are a variation of the more standard VAE formulation introducing a conditioning variable on sampling from the latent prior, allowing the modeling of *one-to-many* relationships between latent and data samples. Further, in stark contrast with previous work @florenceImplicitBehavioralCloning2022, @jannerPlanningDiffusionFlexible2022, @zhaoLearningFineGrainedBimanual2023 do not learn a full joint $p_\theta(o,a)$ on observation and actions. While the *policy* distribution $p_\theta(a \vert o)$ can in principle be entirely described from its joint $p_\theta(o,a)$, it is often the case that the conditional distribution is intractable when using function approximators, as $p_\theta(a \vert o) = \tfrac{p_\theta(o,a)}{\int_\mathcal Ap_\theta(o,a)}$ and the integral in the denominator is typically intractable. Instead of modeling the full joint using a vanilla VAE, @zhaoLearningFineGrainedBimanual2023 propose learning a *conditional* VAE @sohnLearningStructuredOutput2015 modeling the policy distribution directly $p (a \vert o)$.
 
-In practice, when learning from demonstrations adopting CVAEs results in a slight modification to the VAE objective in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, which is adapted to $\htmlId{c-ELBO}{\text{ELBO}_{\mathcal D}(\theta, \phi, \omega) = \sum_{i=0}^{N} \left( \mathbb{E}_{z \sim q_\phi(\cdot \vert o_i, a_i)} \big[ \log p_\theta(a_i \vert z, o_i) \big] - \text{D}_{\text{KL}}\big[ q_\phi(z \vert o_i, a_i) \Vert p_\omega(z \vert o_i) \big] \right)}$ Notice how in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> we are now also learning a new set of parameters $\omega$ for the prior distribution in the latent space. Effectively, this enables conditioning latent-space sampling (and thus reconstruction) during training, and potentially inference, providing useful when learning inherently conditional distributions like policies. Further, ACT is trained as a $\beta$-CVAE @higgins2017beta, using a weight of the KL regularization term in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> as an hyperparameter regulating the information condensed in the latent space, where higher $\beta$ results in a less expressive latent space.
+In practice, when learning from demonstrations adopting CVAEs results in a slight modification to the VAE objective in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, which is adapted to
+``` math
+\begin{align}
+
+    \text{ELBO}_{\mathcal D}(\theta, \phi, \omega) = \sum_{i=0}^{N} \left(
+            \mathbb{E}_{z \sim q_\phi(\cdot \vert o_i, a_i)} \big[ \log p_\theta(a_i \vert z, o_i) \big]
+        - \text{D}_{\text{KL}}\big[ q_\phi(z \vert o_i, a_i) \Vert p_\omega(z \vert o_i) \big]
+        \right)
+\end{align}
+```
+Notice how in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> we are now also learning a new set of parameters $\omega$ for the prior distribution in the latent space. Effectively, this enables conditioning latent-space sampling (and thus reconstruction) during training, and potentially inference, providing useful when learning inherently conditional distributions like policies. Further, ACT is trained as a $\beta$-CVAE @higgins2017beta, using a weight of the KL regularization term in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> as an hyperparameter regulating the information condensed in the latent space, where higher $\beta$ results in a less expressive latent space.
 
 In their work, @zhaoLearningFineGrainedBimanual2023 ablated using a GM to learn from human demonstrations compared to a simpler, supervised objective, $\mathcal L_1(a,a^\prime) = \Vert a - a^\prime \Vert_1$. Interestingly, they found the performance of these two approaches to be comparable when learning from *scripted* demonstrations. That is, when learning from data collected rolling out a predetermined set of commands $[q^c_0, q^c_1, \dots]$, GM did *not* prove competitive compared to standard supervised learning. However, when learning from human demonstrations--i.e., from data collected executing commands coming from a human controller $[q^h_0, q^h_1, \dots]$--they found performance (success rate on a downstream task) to be severily (-33.3%) hindered from adopting a standard supervised learning objective compared to a richer, potentially more complex to learn variational objective, in keeping with the multimodal nature of human demonstrations data and findings presented in @florenceImplicitBehavioralCloning2022. The authors also ablate the action chunking paradigm, reporting significant performance gains for performing action chunking (1% vs. 44% success rate). To avoid acting openloop, @zhaoLearningFineGrainedBimanual2023 design an inference process consisting in performing inference at every timestep $t$ and then aggregate overlapping chunks using chunks’ exponential moving average.
 
@@ -973,7 +1067,7 @@ In their work, @zhaoLearningFineGrainedBimanual2023 ablated using a GM to learn
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-act" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-act" style="position: absolute;"></span>
 <figcaption>Action Chunking with Transformer (ACT), as in @zhaoLearningFineGrainedBimanual2023. ACT introduces an action chunking paradigm to cope with high-dimensional multi-modal demonstration data, and a transformer-based CVAE architecture.</figcaption>
 </figure>
 
@@ -987,7 +1081,7 @@ In ACT (Figure <a href="#ch4-act" data-reference-type="ref" data-reference="ch4
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-act-encoder" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-act-encoder" style="position: absolute;"></span>
 <figcaption>The CVAE encoder used in ACT. Input action chunks are first embedded and aggregated with positional embeddings, before being processed alongside embedded proprioperceptive information, and a learned <code>[CLS]</code> token used to aggregate input level information, and predict the style variable <span class="math inline"> <em>z</em> </span>. The encoder is entirely disregarded at inference time.</figcaption>
 </figure>
 
@@ -1001,7 +1095,7 @@ However, the authors claim using a deterministic procedure to derive $z$ may ben
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-act-decoder" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-act-decoder" style="position: absolute;"></span>
 <figcaption>The CVAE decoder used in ACT, comprising of a full encoder-decoder Transformer architecture. Camera observations from all <span class="math inline"> <em>n</em> </span> camera views are first embedded using pre-trained visual encoders, and then concatenated to the corresponding positional embeddings. Then, alongside embeddings for the proprioperceptive information available and the style variable <span class="math inline"> <em>z</em> </span> retrieved from the CVAE encoder, the Transformer encoder shares the matrices <span class="math inline"> <em>K</em>, <em>Q</em> </span> with the Transformer decoder, trained to decode fixed position embeddings into action valid chunks.</figcaption>
 </figure>
 
@@ -1011,13 +1105,17 @@ However, the authors claim using a deterministic procedure to derive $z$ may ben
 
 DMs proved very effective in approximating complex highly dimensional distributions, such as distributions over images @hoDenoisingDiffusionProbabilistic2020 or videos @polyakMovieGenCast2025, thanks to their inherent capability to deal with multimodal data and training stability. In Diffusion Policy (DP), @chiDiffusionPolicyVisuomotor2024 present an application of DMs the field of robot learning, leveraging diffusion to model human expert demonstrations in a variety of simulated and real-world tasks. Similarily to Action Chunking with Transformer @zhaoLearningFineGrainedBimanual2023, @chiDiffusionPolicyVisuomotor2024 (1) adopt a modified *observation-conditioned target distribution* instead of the full joint $p(o,a)$ and (2) predict multiple actions into the future instead of a single action. Besides the intractability of the observations’ marginal $p_\theta(o)$ given $p_\theta(o,a)$, DP’s rationale for modeling the data distribution via $p_\theta(a \vert o)$ stems from the rather test-time compute intensive nature of diffusion, whereby generating actions *alongside* observations is likely to result in higher complexity and thus a likely larger number of denoising operations, which would prove ultimately pointless considering robotics applications rely on the capability to generate controls rather than reproducing observations.
 
-In practice, conditioning on observation data is achieved conditioning the added noise regressor $\epsilon_\theta$ introduced in <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a> on a stack of $T_o$ observations, resulting in the *conditional* simplified diffusion objective 
-
-$$
-`\htmlId{diffusion-policy-objective}{\mathcal L(\theta) = \mathbb{E}_{t, a_{t:t+H_a}, \epsilon} \big[ \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} a_{t:t+T_a} + \epsilon \sqrt{1 - \bar \alpha_t}, t, o_{t-T_o:t}) \Vert^2 \big],\\ t \sim \mathcal{U}(\{1,\dots,T\}), \quad a_{t:t+T_a}, o_{t-T_o:t} \sim \mathcal{D}, \quad \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}). \notag}`
-$$
-
- Notice how in <a href="#diffusion-policy-objective" data-reference-type="ref" data-reference="diffusion-policy-objective">[diffusion-policy-objective]</a> the noise regressor is conditioned both on the latent variable rank $t$ *and* on a stack of previous observations $o_{t-T_o-t}$.  @chiDiffusionPolicyVisuomotor2024 claim the combination of (1) conditioning on a horizon of previous observations and (2) predicting multiple actions into the future allows DP to *commit to specific modes* in the data at inference time, which proves essential for good performance and avoiding undecisiveness.
+In practice, conditioning on observation data is achieved conditioning the added noise regressor $\epsilon_\theta$ introduced in <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a> on a stack of $T_o$ observations, resulting in the *conditional* simplified diffusion objective
+``` math
+\begin{align}
+    \mathcal L(\theta) &= \mathbb{E}_{t, a_{t:t+H_a}, \epsilon} \big[
+        \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} a_{t:t+T_a} + \epsilon \sqrt{1 - \bar \alpha_t}, t, o_{t-T_o:t}) \Vert^2 \big],  \\
+        & t \sim \mathcal{U}(\{1,\dots,T\}), \quad
+        a_{t:t+T_a}, o_{t-T_o:t} \sim \mathcal{D}, \quad
+        \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}). \notag 
+\end{align}
+```
+Notice how in <a href="#diffusion-policy-objective" data-reference-type="ref" data-reference="diffusion-policy-objective">[diffusion-policy-objective]</a> the noise regressor is conditioned both on the latent variable rank $t$ *and* on a stack of previous observations $o_{t-T_o-t}$.  @chiDiffusionPolicyVisuomotor2024 claim the combination of (1) conditioning on a horizon of previous observations and (2) predicting multiple actions into the future allows DP to *commit to specific modes* in the data at inference time, which proves essential for good performance and avoiding undecisiveness.
 
 <figure>
 <ResponsiveImage
@@ -1027,7 +1125,7 @@ $$
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="diffusion-policy-architecture" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="diffusion-policy-architecture" style="position: absolute;"></span>
 <figcaption>The Diffusion Policy archicture, as in @chiDiffusionPolicyVisuomotor2024. A stack of <span class="math inline"> <em>H</em> <sub> <em>o</em> </sub> </span> previous observations is used as external conditioning to denoise a group of <span class="math inline"> <em>H</em> <sub> <em>a</em> </sub> </span> actions. Conditioning is used at every layer of a U-Net block, and in practice allows to obtain fully-formed action chunks with as little as <span class="math inline"> <em>T</em> = 10</span> denoising steps.</figcaption>
 </figure>
 
@@ -1058,7 +1156,7 @@ We directly assess the lack of adaptiveness of robot systems due to acting open-
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-async-inference" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-async-inference" style="position: absolute;"></span>
 </div>
 <figcaption><strong>Asynchronous inference</strong>. Illustration of the asynchronous inference stack. Note that the policy can be run on a remote server, possibly with GPUs.</figcaption>
 </figure>
@@ -1101,7 +1199,7 @@ Interestingly, the behavior of async inference can be studied analytically. Firs
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-queues" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-queues" style="position: absolute;"></span>
 </div>
 <figcaption>Action queue size evolution at runtime for various levels of <span class="math inline"> <em>g</em> </span> when (A) not filtering out observation based on joint-space similarity and (B) filtering out near-duplicates observation, measuring their similarity in joint-space.</figcaption>
 </figure>
@@ -1135,7 +1233,7 @@ The advent of large models trained on internet-scale datasets has drastically in
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-ml-vs-robotics-foundation" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-ml-vs-robotics-foundation" style="position: absolute;"></span>
 <figcaption>Fields within ML such as Computer Vision and NLP converged on the development of foundation models, trained on a variety of large scale models and capable to perform multiple downstream tasks (top). Conversely, robotics suffered from limited standardization in terms of the architectures used, and siloed, task specific datasets, incurring in a high degree of fragmentation which traditionally hindered the development of generalist models for robotics in favour of task-specific models (bottom).</figcaption>
 </figure>
 
@@ -1151,7 +1249,7 @@ The remarkable success of foundation models in NLP and CV is predicated on two c
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-generalist-policies-timeline" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-generalist-policies-timeline" style="position: absolute;"></span>
 <figcaption>Early efforts in the development of generalist models for robotics include BC-Zero @jangBCZZeroShotTask2022, RT-1 @brohanRT1RoboticsTransformer2023, and RT-2 @brohanRT2VisionLanguageActionModels2023: large scale models trained on thousands of demonstrations. The open release of the Open-X @collaborationOpenXEmbodimentRobotic2025 and DROID datasets @khazatskyDROIDLargeScaleInTheWild2025 fostered the development of open source models: OpenVLA @kimOpenVLAOpenSourceVisionLanguageAction2024, <span class="math inline"> <em>π</em> <sub>0</sub> </span> @blackp0VisionLanguageActionFlow2024 and SmolVLA @shukorSmolVLAVisionLanguageActionModel2025.</figcaption>
 </figure>
 
@@ -1171,7 +1269,7 @@ The success of large, proprietary models like RT-1 and RT-2, highlighted a growi
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-trends" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-trends" style="position: absolute;"></span>
 <figcaption>Robot learning is undergoing a paradigmatic shift: centralized data collections (A, left) are increasingly larger, often comprising Ms of demonstrations, and (A, right) decentralized approaches to data collection are also rising as an alternative for large scale data collection. (B) Generalist models are also becoming increasingly smaller and easier to run on limited hardware.</figcaption>
 </figure>
 
@@ -1201,19 +1299,30 @@ $\pi_0$ @blackp0VisionLanguageActionFlow2024 introduce a VLA consisting of a Mo
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-pi0" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-pi0" style="position: absolute;"></span>
 <figcaption>The <span class="math inline"> <em>π</em> <sub>0</sub> </span>architecture, as in @blackp0VisionLanguageActionFlow2024. Vision and language tokens are routed to a VLM backbone which is prevented from attending robot proprioperceptive states and action tokens, which are instead routed to a smaller subset of weights within the architecture. The architecture is trained with Flow Matching on 10M+ trajectories from a mixture of closed and openly available datasets.</figcaption>
 </figure>
 
 Concretely, $\pi_0$ is a unified transformer with two disjoint sets of weights $\phi, \theta$. A larger VLM backbone $p_\phi$ initialized from Gemma 2.6B processes multiple image frames obtained from multiple cameras points $[\{ I_t \}_{t=1}^n]$, as well as a language instruction $[\ell_t]$ used to describe the task considered. Concurrently, a 300M-parameter *action expert* based on a similar transformer architecture is used processes the robot proprioperceptive state $q_t$ and an action chunk $a_{t:t+H_a}$ (Figure <a href="#ch5-pi0" data-reference-type="ref" data-reference="ch5-pi0">[ch5-pi0]</a>). The different expert networks operate separately in processing the respective inputs and turning them into query, key and value matrices, and only share information between each other via self-attention layers. The outputs from the VLM backbone are disregarded, while the vector field regressed by the action expert is used to iteratively refine the action process. In particular, $\pi_0$uses a *blockwise causal attention mask* over tokens belonging to three separate blocks: (1) image and language tokens $\mathcal T_i$ obtained from $[\{ I_t \}_{t=1}^n, \ell_t]$, (2) proprioperceptive tokens $\mathcal T_q$ obtained from $q_t$, and (3) the action tokens $\mathcal T_a$ for items in the chunk $a^{\tau}_{t:t+H_a}$ at time $\tau$ in the flow-matching process. Notably, *within* each block the attention operations are bidirectional, while across blocks, future blocks are masked out. Formally, this corresponds to using the attention mask $\mathbf{A} = \bordermatrix{ \mathcal{T}_i \mathcal{T}_q \mathcal{T}_a \cr \mathcal{T}_i \mathbf{1} \mathbf{0} \mathbf{0} \cr \mathcal{T}_q \mathbf{1} \mathbf{1} \mathbf{0} \cr \mathcal{T}_a \mathbf{1} \mathbf{1} \mathbf{1} \cr }, \quad \mathbf{1}: \text{Bidirectional Attention}, \ \mathbf{0}: \text{Masked Attention}$ Note how *intra*-block directional attention allows tokens to communicate freely, while *inter*-block communication is mediated by the attention mask $\mathbf{A}$. *Blockwise causal masking* effectively prevents the pre-trained perception-language tokens from attending to robotics-tokens, likely out of distribution for VLM backbones traditionally trained on large corpora of internet, non-robotics, data. Crucially, because communication is obstructed between image-language tokens, proprioperceptive and action tokens, one can cache keys and values across denoising steps at runtime time, incuring in a reduced computational footprint and faster inference.
 
-In $\pi_0$, both the VLM backbone and action expert are update using a *flow matching* loss, and in particular are updated minimizing: 
+In $\pi_0$, both the VLM backbone and action expert are update using a *flow matching* loss, and in particular are updated minimizing:
+``` math
+\begin{align}
+    \mathcal{L}(\phi, \theta) &= 
+    \mathbb{E}_{\tau, \epsilon, o_t, a_{t:t+H_a}}\Big[
+        \big\Vert 
+            v_\theta(\underbrace{\tau a_{t:t+H_a} + (1-\tau) \epsilon}_{\tilde a_{t:t+H_a}},\, o_t,\, \tau)
+            - (\epsilon - a_{t:t+H_a})
+        \big\Vert^2
+    \Big],  \\
+    &\tau \sim \mathrm{Beta}_{[0,s]}(1.5,1), \quad
+    \epsilon \sim \mathcal{N}(\mathbf{0}, \mathbf{I}), \quad
+    o_t, a_{t:t+H_a} \sim \mathcal D \notag
+\end{align}
+```
 
-$$
-`\htmlId{pi0-loss}{\mathcal{L}(\phi, \theta) = \mathbb{E}_{\tau, \epsilon, o_t, a_{t:t+H_a}}\Big[ \big\Vert v_\theta(\underbrace{\tau a_{t:t+H_a} + (1-\tau) \epsilon}_{\tilde a_{t:t+H_a}},\, o_t,\, \tau) - (\epsilon - a_{t:t+H_a}) \big\Vert^2 \Big],\\ \tau \sim \mathrm{Beta}_{[0,s]}(1.5,1), \quad \epsilon \sim \mathcal{N}(\mathbf{0}, \mathbf{I}), \quad o_t, a_{t:t+H_a} \sim \mathcal D \notag}`
-$$
+Where the experts parametrized by the separate weights $\phi, \theta$ interact with each other via self-attention layers only, so that the action expert $v_\theta$ internal computations also depend on the VLM backbone’s parameters $\phi$. Importantly, @blackp0VisionLanguageActionFlow2024 minimize <a href="#pi0-loss" data-reference-type="ref" data-reference="pi0-loss">[pi0-loss]</a> over both the multimodal backbone and action expert parameters, thus updating the internal representations of the VLM using BC-specific gradients. In contrast, @driessKnowledgeInsulatingVisionLanguageAction2025 later show that failing to insulate the VLM knowledge from the flow matching gradients actually harms performance. Inference is performed iteratively refining action chunks while numerically forward-integrating the vector field predicted by the action expert,
 
- Where the experts parametrized by the separate weights $\phi, \theta$ interact with each other via self-attention layers only, so that the action expert $v_\theta$ internal computations also depend on the VLM backbone’s parameters $\phi$. Importantly, @blackp0VisionLanguageActionFlow2024 minimize <a href="#pi0-loss" data-reference-type="ref" data-reference="pi0-loss">[pi0-loss]</a> over both the multimodal backbone and action expert parameters, thus updating the internal representations of the VLM using BC-specific gradients. In contrast, @driessKnowledgeInsulatingVisionLanguageAction2025 later show that failing to insulate the VLM knowledge from the flow matching gradients actually harms performance. Inference is performed iteratively refining action chunks while numerically forward-integrating the vector field predicted by the action expert,
 ``` math
 \begin{equation}
     a_{t:t+H_a}^{\tau + \delta} = a_{t:t+H_a}^{\tau } + \delta v_\theta(a_{t:t+H_a}^{\tau }, o_t)
@@ -1255,7 +1364,7 @@ VLAs remain in an early stage of development and are not yet as mature or widely
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-smolvla" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-smolvla" style="position: absolute;"></span>
 <figcaption>The SmolVLA architecture, as in @shukorSmolVLAVisionLanguageActionModel2025. SmolVLA is a compact MoE model trained with flow matching to denoise action chunks. Vision and language tokens are fed to a VLM backbone, and share information with the proprioperceptive and action tokens via the attention mechanism. The attention expert interleaves SA and CA layers for further conditioning on the visual features from the VLM backbone. SmolVLA skips computations and reduces the visual tokens, resulting in 6x less memory usage than <span class="math inline"> <em>π</em> <sub>0</sub> </span>.</figcaption>
 </figure>
 
diff --git a/app/scripts/latex-to-markdown/package-lock.json b/app/scripts/latex-to-mdx/package-lock.json
similarity index 100%
rename from app/scripts/latex-to-markdown/package-lock.json
rename to app/scripts/latex-to-mdx/package-lock.json
diff --git a/app/scripts/latex-to-markdown/package.json b/app/scripts/latex-to-mdx/package.json
similarity index 65%
rename from app/scripts/latex-to-markdown/package.json
rename to app/scripts/latex-to-mdx/package.json
index 38618b31ca768a7c349ebe774ae58e31196bd6b1..16850d0a30f47e351a3303970a7ce3a2a881abb5 100644
Binary files a/app/scripts/latex-to-markdown/package.json and b/app/scripts/latex-to-mdx/package.json differ
diff --git a/app/scripts/latex-to-markdown/post-processor.mjs b/app/scripts/latex-to-mdx/post-processor.mjs
similarity index 82%
rename from app/scripts/latex-to-markdown/post-processor.mjs
rename to app/scripts/latex-to-mdx/post-processor.mjs
index 262404ed25cd8a683f7e2c88513a9f183db5205b..be91e72eda5e8d2d0856871251b76d706eb1751f 100644
--- a/app/scripts/latex-to-markdown/post-processor.mjs
+++ b/app/scripts/latex-to-mdx/post-processor.mjs
@@ -68,6 +68,45 @@ function fixMathCommands(content) {
         .replace(/\\vdots/g, '\\vdots'); // This one should be fine, but kept for consistency
 }
 
+/**
+ * Convert LaTeX matrix commands to KaTeX-compatible environments
+ * @param {string} content - Markdown content
+ * @returns {string} - Content with fixed matrix commands
+ */
+function fixMatrixCommands(content) {
+    console.log('  🔢 Converting matrix commands to KaTeX format...');
+
+    let fixedCount = 0;
+
+    // Convert \pmatrix{...} to \begin{pmatrix}...\end{pmatrix}
+    content = content.replace(/\\pmatrix\{([^{}]*(?:\{[^{}]*\}[^{}]*)*)\}/g, (match, matrixContent) => {
+        fixedCount++;
+        // Split by \\ for rows, handle nested braces
+        const rows = matrixContent.split('\\\\').map(row => row.trim()).filter(row => row);
+        return `\\begin{pmatrix}\n${rows.join(' \\\\\n')}\n\\end{pmatrix}`;
+    });
+
+    // Convert \bmatrix{...} to \begin{bmatrix}...\end{bmatrix}
+    content = content.replace(/\\bmatrix\{([^{}]*(?:\{[^{}]*\}[^{}]*)*)\}/g, (match, matrixContent) => {
+        fixedCount++;
+        const rows = matrixContent.split('\\\\').map(row => row.trim()).filter(row => row);
+        return `\\begin{bmatrix}\n${rows.join(' \\\\\n')}\n\\end{bmatrix}`;
+    });
+
+    // Convert \vmatrix{...} to \begin{vmatrix}...\end{vmatrix}
+    content = content.replace(/\\vmatrix\{([^{}]*(?:\{[^{}]*\}[^{}]*)*)\}/g, (match, matrixContent) => {
+        fixedCount++;
+        const rows = matrixContent.split('\\\\').map(row => row.trim()).filter(row => row);
+        return `\\begin{vmatrix}\n${rows.join(' \\\\\n')}\n\\end{vmatrix}`;
+    });
+
+    if (fixedCount > 0) {
+        console.log(`    ✅ Fixed ${fixedCount} matrix command(s)`);
+    }
+
+    return content;
+}
+
 /**
  * Fix Unicode characters that break MDX/JSX parsing
  * @param {string} content - Markdown content
@@ -102,13 +141,18 @@ function fixMultilineMath(content) {
     console.log('  📏 Fixing multiline math expressions for MDX...');
 
     return content
-        // Convert multiline inline math to display math blocks
-        .replace(/\$([^$]*?\\\\[^$]*?)\$/gs, (match, mathContent) => {
-            // Remove leading/trailing whitespace and normalize newlines
-            const cleanedMath = mathContent
-                .replace(/^\s+|\s+$/g, '')
-                .replace(/\s*\\\\\s*/g, '\\\\\n    ');
-            return `$$\n${cleanedMath}\n$$`;
+        // Convert multiline inline math to display math blocks (more precise regex)
+        // Only match if the content is a self-contained math expression within a single line
+        .replace(/\$([^$\n]*\\\\[^$\n]*)\$/g, (match, mathContent) => {
+            // Only convert if it contains actual math operators and line breaks
+            if (mathContent.includes('\\\\') && /[=+\-*/^_{}]/.test(mathContent)) {
+                // Remove leading/trailing whitespace and normalize newlines
+                const cleanedMath = mathContent
+                    .replace(/^\s+|\s+$/g, '')
+                    .replace(/\s*\\\\\s*/g, '\\\\\n    ');
+                return `$$\n${cleanedMath}\n$$`;
+            }
+            return match; // Keep original if it doesn't look like multiline math
         })
         // Ensure display math blocks are properly separated
         .replace(/\$\$\s*\n\s*([^$]+?)\s*\n\s*\$\$/g, (match, mathContent) => {
@@ -272,6 +316,7 @@ export function postProcessMarkdown(content, inputDir = null) {
     processedContent = simplifyLatexDelimiters(processedContent);
     processedContent = removeOrphanedLabels(processedContent);
     processedContent = fixMathCommands(processedContent);
+    processedContent = fixMatrixCommands(processedContent);
     processedContent = fixUnicodeIssues(processedContent);
     processedContent = fixMultilineMath(processedContent);
     processedContent = fixAllAttributes(processedContent);
diff --git a/app/scripts/latex-to-markdown/reference-preprocessor.mjs b/app/scripts/latex-to-mdx/reference-preprocessor.mjs
similarity index 100%
rename from app/scripts/latex-to-markdown/reference-preprocessor.mjs
rename to app/scripts/latex-to-mdx/reference-preprocessor.mjs
diff --git a/app/src/components/Hero.astro b/app/src/components/Hero.astro
index 6484663672e6815fea4e9b8e3881e3255a97bc09..454b0d83584b1d19c4b0148dce5d1da9796dbb5b 100644
--- a/app/src/components/Hero.astro
+++ b/app/src/components/Hero.astro
@@ -5,26 +5,49 @@ interface Props {
   title: string; // may contain HTML (e.g., <br/>)
   titleRaw?: string; // plain title for slug/PDF (optional)
   description?: string;
-  authors?: Array<string | { name: string; url?: string; affiliationIndices?: number[] }>;
+  authors?: Array<
+    string | { name: string; url?: string; affiliationIndices?: number[] }
+  >;
   affiliations?: Array<{ id: number; name: string; url?: string }>;
   affiliation?: string; // legacy single affiliation
   published?: string;
   doi?: string;
 }
 
-const { title, titleRaw, description, authors = [], affiliations = [], affiliation, published, doi } = Astro.props as Props;
+const {
+  title,
+  titleRaw,
+  description,
+  authors = [],
+  affiliations = [],
+  affiliation,
+  published,
+  doi,
+} = Astro.props as Props;
 
 type Author = { name: string; url?: string; affiliationIndices?: number[] };
 
-function normalizeAuthors(input: Array<string | { name?: string; url?: string; link?: string; affiliationIndices?: number[] }>): Author[] {
+function normalizeAuthors(
+  input: Array<
+    | string
+    | {
+        name?: string;
+        url?: string;
+        link?: string;
+        affiliationIndices?: number[];
+      }
+  >,
+): Author[] {
   return (Array.isArray(input) ? input : [])
     .map((a) => {
-      if (typeof a === 'string') {
+      if (typeof a === "string") {
         return { name: a } as Author;
       }
-      const name = (a?.name ?? '').toString();
+      const name = (a?.name ?? "").toString();
       const url = (a?.url ?? a?.link) as string | undefined;
-      const affiliationIndices = Array.isArray((a as any)?.affiliationIndices) ? (a as any).affiliationIndices : undefined;
+      const affiliationIndices = Array.isArray((a as any)?.affiliationIndices)
+        ? (a as any).affiliationIndices
+        : undefined;
       return { name, url, affiliationIndices } as Author;
     })
     .filter((a) => a.name && a.name.trim().length > 0);
@@ -35,35 +58,41 @@ const normalizedAuthors: Author[] = normalizeAuthors(authors as any);
 // Determine if affiliation superscripts should be shown (only when there are multiple distinct affiliations referenced by authors)
 const authorAffiliationIndexSet = new Set<number>();
 for (const author of normalizedAuthors) {
-  const indices = Array.isArray(author.affiliationIndices) ? author.affiliationIndices : [];
+  const indices = Array.isArray(author.affiliationIndices)
+    ? author.affiliationIndices
+    : [];
   for (const idx of indices) {
-    if (typeof idx === 'number') {
+    if (typeof idx === "number") {
       authorAffiliationIndexSet.add(idx);
     }
   }
 }
 const shouldShowAffiliationSupers = authorAffiliationIndexSet.size > 1;
-const hasMultipleAffiliations = Array.isArray(affiliations) && affiliations.length > 1;
+const hasMultipleAffiliations =
+  Array.isArray(affiliations) && affiliations.length > 1;
 
 function stripHtml(text: string): string {
-  return String(text || '').replace(/<[^>]*>/g, '');
+  return String(text || "").replace(/<[^>]*>/g, "");
 }
 
 function slugify(text: string): string {
-  return String(text || '')
-    .normalize('NFKD')
-    .replace(/\p{Diacritic}+/gu, '')
-    .toLowerCase()
-    .replace(/[^a-z0-9]+/g, '-')
-    .replace(/^-+|-+$/g, '')
-    .slice(0, 120) || 'article';
+  return (
+    String(text || "")
+      .normalize("NFKD")
+      .replace(/\p{Diacritic}+/gu, "")
+      .toLowerCase()
+      .replace(/[^a-z0-9]+/g, "-")
+      .replace(/^-+|-+$/g, "")
+      .slice(0, 120) || "article"
+  );
 }
 
 const pdfBase = titleRaw ? stripHtml(titleRaw) : stripHtml(title);
 const pdfFilename = `${slugify(pdfBase)}.pdf`;
 ---
+
 <section class="hero">
-  <h1 class="hero-title" set:html={title}></h1>
+  <h1 class="hero-title" set:html={title} />
   <div class="hero-banner">
     <HtmlEmbed src="banner.html" frameless />
     {description && <p class="hero-desc">{description}</p>}
@@ -72,53 +101,81 @@ const pdfFilename = `${slugify(pdfBase)}.pdf`;
 
 <header class="meta" aria-label="Article meta information">
   <div class="meta-container">
-    {normalizedAuthors.length > 0 && (
-      <div class="meta-container-cell">
-        <h3>Author{normalizedAuthors.length > 1 ? 's' : ''}</h3>
-        <ul class="authors">
-          {normalizedAuthors.map((a, i) => {
-            const supers = shouldShowAffiliationSupers && Array.isArray(a.affiliationIndices) && a.affiliationIndices.length
-              ? <sup>{a.affiliationIndices.join(',')}</sup>
-              : null;
-            return (
-              <li>
-                {a.url ? <a href={a.url}>{a.name}</a> : a.name}{supers}
-              </li>
-            );
-          })}
-        </ul>
-      </div>
-    )}
-    {(Array.isArray(affiliations) && affiliations.length > 0) && (
-      <div class="meta-container-cell">
-        <h3>Affiliation{affiliations.length > 1 ? 's' : ''}</h3>
-        {hasMultipleAffiliations ? (
-          <ol class="affiliations">
-            {affiliations.map((af) => (
-              <li value={af.id}>{af.url ? <a href={af.url} target="_blank" rel="noopener noreferrer">{af.name}</a> : af.name}</li>
-            ))}
-          </ol>
-        ) : (
-          <p>
-            {affiliations[0]?.url 
-              ? <a href={affiliations[0].url} target="_blank" rel="noopener noreferrer">{affiliations[0].name}</a> 
-              : affiliations[0]?.name}
-          </p>
-        )}
-      </div>
-    )}
-    {(!affiliations || affiliations.length === 0) && affiliation && (
-      <div class="meta-container-cell">
-        <h3>Affiliation</h3>
-        <p>{affiliation}</p>
-      </div>
-    )}
-    {published && (
-      <div class="meta-container-cell meta-container-cell--published">
-        <h3>Published</h3>
-        <p>{published}</p>
-      </div>
-    )}
+    {
+      normalizedAuthors.length > 0 && (
+        <div class="meta-container-cell">
+          <h3>Author{normalizedAuthors.length > 1 ? "s" : ""}</h3>
+          <ul class="authors">
+            {normalizedAuthors.map((a, i) => {
+              const supers =
+                shouldShowAffiliationSupers &&
+                Array.isArray(a.affiliationIndices) &&
+                a.affiliationIndices.length ? (
+                  <sup>{a.affiliationIndices.join(",")}</sup>
+                ) : null;
+              return (
+                <li>
+                  {a.url ? <a href={a.url}>{a.name}</a> : a.name}
+                  {supers}
+                </li>
+              );
+            })}
+          </ul>
+        </div>
+      )
+    }
+    {
+      Array.isArray(affiliations) && affiliations.length > 0 && (
+        <div class="meta-container-cell">
+          <h3>Affiliation{affiliations.length > 1 ? "s" : ""}</h3>
+          {hasMultipleAffiliations ? (
+            <ol class="affiliations">
+              {affiliations.map((af) => (
+                <li value={af.id}>
+                  {af.url ? (
+                    <a href={af.url} target="_blank" rel="noopener noreferrer">
+                      {af.name}
+                    </a>
+                  ) : (
+                    af.name
+                  )}
+                </li>
+              ))}
+            </ol>
+          ) : (
+            <p>
+              {affiliations[0]?.url ? (
+                <a
+                  href={affiliations[0].url}
+                  target="_blank"
+                  rel="noopener noreferrer"
+                >
+                  {affiliations[0].name}
+                </a>
+              ) : (
+                affiliations[0]?.name
+              )}
+            </p>
+          )}
+        </div>
+      )
+    }
+    {
+      (!affiliations || affiliations.length === 0) && affiliation && (
+        <div class="meta-container-cell">
+          <h3>Affiliation</h3>
+          <p>{affiliation}</p>
+        </div>
+      )
+    }
+    {
+      published && (
+        <div class="meta-container-cell meta-container-cell--published">
+          <h3>Published</h3>
+          <p>{published}</p>
+        </div>
+      )
+    }
     <!-- {doi && (
       <div class="meta-container-cell">
         <h3>DOI</h3>
@@ -128,7 +185,12 @@ const pdfFilename = `${slugify(pdfBase)}.pdf`;
     <div class="meta-container-cell meta-container-cell--pdf">
       <h3>PDF</h3>
       <p>
-        <a class="button" href={`/${pdfFilename}`} download={pdfFilename} aria-label={`Download PDF ${pdfFilename}`}>
+        <a
+          class="button"
+          href={`/${pdfFilename}`}
+          download={pdfFilename}
+          aria-label={`Download PDF ${pdfFilename}`}
+        >
           Download PDF
         </a>
       </p>
@@ -136,7 +198,6 @@ const pdfFilename = `${slugify(pdfBase)}.pdf`;
   </div>
 </header>
 
-
 <style>
   /* Hero (full-width) */
   .hero {
@@ -185,7 +246,7 @@ const pdfFilename = `${slugify(pdfBase)}.pdf`;
     text-underline-offset: 2px;
     text-decoration-thickness: 0.06em;
     text-decoration-color: var(--link-underline);
-    transition: text-decoration-color .15s ease-in-out;
+    transition: text-decoration-color 0.15s ease-in-out;
   }
   .meta-container a:hover {
     text-decoration-color: var(--link-underline-hover);
@@ -205,11 +266,11 @@ const pdfFilename = `${slugify(pdfBase)}.pdf`;
     font-weight: 400;
     color: var(--muted-color);
     text-transform: uppercase;
-    letter-spacing: .02em;
+    letter-spacing: 0.02em;
   }
   .meta-container-cell p {
     margin: 0;
-  } 
+  }
   .authors {
     margin: 0;
     list-style-type: none;
@@ -227,12 +288,10 @@ const pdfFilename = `${slugify(pdfBase)}.pdf`;
     flex-wrap: wrap;
     row-gap: 12px;
   }
-  
+
   @media print {
     .meta-container-cell--pdf {
       display: none !important;
     }
   }
 </style>
-
-
diff --git a/app/src/content/article.mdx b/app/src/content/article.mdx
index 4eb0c151f674be4e9c1b5e21bc569f85e9da7f86..9ad4c1e32ebca86fca36c154b9262b785a19a0ae 100644
--- a/app/src/content/article.mdx
+++ b/app/src/content/article.mdx
@@ -89,7 +89,7 @@ We sincerely hope this tutorial serves as a valuable starting point for your jou
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="figure1" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="figure1" style="position: absolute;"></span>
 <figcaption><code>lerobot</code> is the open-source library for end-to-end robotics developed by Hugging Face. The library is vertically integrated on the entire robotics stack, supporting low-level control of real-world robot devices, advanced data and inference optimizations, as well as SOTA robot learning methods with simple implementations in pure Pytorch.</figcaption>
 </figure>
 
@@ -181,7 +181,12 @@ streaming_dataset = StreamingLeRobotDataset(
 # Get the 100th frame in the dataset by 
 sample = dataset[100]
 print(sample)
-# 
+# {
+# 'observation.state': tensor([...]), 
+# 'action': tensor([...]), 
+# 'observation.images.wrist_camera': tensor([3, C, H, W]), for delta timesteps
+# ...
+# }
 
 batch_size=16
 # wrap the dataset in a DataLoader to use process it batches for training purposes
@@ -233,7 +238,7 @@ TL;DR Learning-based approaches to robotics are motivated by the need to (1) gen
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="generating-motion-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="generating-motion-atlas" style="position: absolute;"></span>
 <figcaption>Overview of methods to generate motion (clearly non-exhausitve, see @bekrisStateRobotMotion2024). The different methods can be grouped based on whether they explicitly (<em>dynamics-based</em>) or implicitly (<em>learning-based</em>) model robot-environment interactions.</figcaption>
 </figure>
 
@@ -251,7 +256,7 @@ Methods to produce robotics motion range from traditional *explicit* models--<sp
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robotics-platforms-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robotics-platforms-atlas" style="position: absolute;"></span>
 <figcaption>Different kinds of motions are achieved with potentially very different robotic platforms. From left to right, top to bottom: ViperX, SO-100, Boston Dynamics’ Spot, Open-Duck, 1X’s NEO, Boston Dynamics’ Atlas. This is an example list of robotic platforms and is (very) far from being exhaustive.</figcaption>
 </figure>
 
@@ -275,7 +280,7 @@ Recently, the development of low-cost manipulators like the ALOHA @zhaoLearning
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robotic-platforms-costs" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robotic-platforms-costs" style="position: absolute;"></span>
 <figcaption>Cheaper, more accessible robots are starting to rival traditional platforms like the Panda arm platforms in adoption in resource-constrained scenarios. The SO-100, in particular, has a cost in the 100s of Euros, and can be entirely 3D-printed in hours, while the industrially-manufactured Panda arm costs tens of thousands of Euros and is not openly available.</figcaption>
 </figure>
 
@@ -289,7 +294,7 @@ Deriving an intuition as per why learning-based approaches are gaining popularit
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="make-so100-planar-manipulator" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="make-so100-planar-manipulator" style="position: absolute;"></span>
 <figcaption>The SO-100 arm is a 6-dof manipulator arm. Preventing some of its joints (shoulder pane, wrist flex and wrist roll) from actuating, it can be represented as a traditional 2-dof planar manipulator (the gripper joint in the end-effector is not considered towards the count of the degrees of freedom used to produce motion).</figcaption>
 </figure>
 
@@ -308,7 +313,7 @@ All these simplifying assumptions leave us with the planar manipulator of Figure
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="planar-manipulation-simple" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="planar-manipulation-simple" style="position: absolute;"></span>
 <figcaption>Free to move</figcaption>
 </figure>
 <figure>
@@ -319,7 +324,7 @@ All these simplifying assumptions leave us with the planar manipulator of Figure
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="planar-manipulator-floor" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="planar-manipulator-floor" style="position: absolute;"></span>
 <figcaption>Constrained by the surface</figcaption>
 </figure>
 <figure>
@@ -330,25 +335,24 @@ All these simplifying assumptions leave us with the planar manipulator of Figure
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="planar-manipulator-floor-shelf" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="planar-manipulator-floor-shelf" style="position: absolute;"></span>
 <figcaption>Constrained by surface and (fixed) obstacle</figcaption>
 </figure>
 <figcaption>Planar, 2-dof schematic representation of the SO-100 manipulator under diverse deployment settings. From left to right: completely free of moving; constrained by the presence of the surface; constrained by the surface and presence of obstacles. Circular arrows around each joint indicate the maximal rotation feasible at that joint.</figcaption>
 </figure>
 
-Considering the (toy) example presented in Figure <a href="#planar-manipulation-simple" data-reference-type="ref" data-reference="planar-manipulation-simple">[planar-manipulation-simple]</a>, then we can analytically write the end-effector’s position $p \in \mathbb R^2$ as a function of the robot’s configuration, $p = p(q), p: \mathcal Q \mapsto \mathbb R^2$. In particular, we have: 
-
-$$
-`p(q) = \begin{pmatrix} p_x(\theta_1, \theta_2)\\ p_y(\theta_1, \theta_2) \end{pmatrix} = \begin{pmatrix} l \cos(\theta_1) + l \cos(\theta_1 + \theta_2)\\ l \sin(\theta_1) + l \sin(\theta_1 + \theta_2) \end{pmatrix} \in S^{n=2}_{l_1+l_2} = \{ p(q) \in \mathbb R^2: \Vert p(q) \Vert_2^2 \leq (2l)^2, \ \forall q \in \mathcal Q \}`
-$$
-
-
+Considering the (toy) example presented in Figure <a href="#planar-manipulation-simple" data-reference-type="ref" data-reference="planar-manipulation-simple">[planar-manipulation-simple]</a>, then we can analytically write the end-effector’s position $p \in \mathbb R^2$ as a function of the robot’s configuration, $p = p(q), p: \mathcal Q \mapsto \mathbb R^2$. In particular, we have: $p(q) = \begin{pmatrix} p_x(\theta_1, \theta_2) \\ p_y(\theta_1, \theta_2) \end{pmatrix} = \begin{pmatrix} l \cos(\theta_1) + l \cos(\theta_1 + \theta_2) \\ l \sin(\theta_1) + l \sin(\theta_1 + \theta_2) \end{pmatrix} \in S^{n=2}_{l_1+l_2} = \{ p(q) \in \mathbb R^2: \Vert p(q) \Vert_2^2 \leq (2l)^2, \ \forall q \in \mathcal Q \}$
 
 Deriving the end-effector’s *pose*--position *and* orientation--in some $m$-dimensional space $\boldsymbol{p} \in \mathcal{P} \subset \mathbb{R}^{m}$ starting from the configuration ${\textnormal{q}}\in \mathcal Q \subset \mathbb R^n$ of a $n$-joints robot is referred to as *forward kinematics* (FK), whereas identifying the configuration corresponding to any given target pose is termed *inverse kinematics* (IK). In that, FK is used to map a robot configuration into the corresponding end-effector pose, whereas IK is used to reconstruct the configuration(s) given an end-effector pose.
 
 In the simplified case here considered (for which $\boldsymbol{p} \equiv p$, as the orientation of the end-effector is disregarded for simplicity), one can solve the problem of controlling the end-effector’s location to reach a goal position $p^*$ by solving analytically for $q: p(q) = f_{\text{FK}}(q) = p^*$. However, in the general case, one might not be able to solve this problem analytically, and can typically resort to iterative optimization methods comparing candidate solutions using a loss function (in the simplest case, $\Vert p(q) - p^* \Vert_2^2$ is a natural candidate), yielding:
 
-$\htmlId{ik_problem}{\min_{q \in \mathcal Q} \Vert p(q) - p^* \Vert_2^2 \, .}$
+``` math
+\begin{align}
+\min_{q \in \mathcal Q} \Vert p(q) - p^* \Vert_2^2 \, .
+
+\end{align}
+```
 
 Exact analytical solutions to IK are even less appealing when one considers the presence of obstacles in the robot’s workspace, resulting in constraints on the possible values of $q \in \mathcal Q \subseteq [-\pi, +\pi]^n \subset \mathbb R^n$ in the general case of $n$-links robots.
 
@@ -356,7 +360,13 @@ For instance, the robot in Figure <a href="#planar-manipulator-floor" data-refe
 
 However, IK--solving eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a> for a feasible $q$--only proves useful in determining information regarding the robot’s configuration in the goal pose, and crucially does not provide information on the *trajectory* to follow over time to reach a target pose. Expert-defined trajectories obviate to this problem providing a length-$K$ succession of goal poses $\tau_K = [p^*_0, p^*_1, \dots p^*_K]$ for tracking. In practice, trajectories can also be obtained automatically through *motion planning* algorithms, thus avoiding expensive trajectory definition from human experts. However, tracking $\tau_K$ via IK can prove prohibitively expensive, as tracking would require $K$ resolutions of eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a> (one for each target pose). *Differential* inverse kinematics (diff-IK) complements IK via closed-form solution of a variant of eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a>. Let $J(q)$ denote the Jacobian matrix of (partial) derivatives of the FK-function $f_\text{FK}- \mathcal Q \mapsto \mathcal P$, such that $J(q) = \frac{\partial f_{FK}(q)}{\partial q }$. Then, one can apply the chain rule to any $p(q) = f_{\text{FK}}(q)$, deriving $\dot p = J(q) \dot q$, and thus finally relating variations in the robot configurations to variations in pose, thereby providing a platform for control.
 
-Given a desired end-effector trajectory $\dot {p}^*(t)$ (1) indicating anchor regions in space and (2) how much time to spend in each region, diff-IK finds $\dot q(t)$ solving for joints’ *velocities* instead of *configurations*, $\htmlId{reg_ik_velocity}{\dot q(t) = \arg\min_\nu \; \lVert J(q(t)) \nu - \dot {p}^*(t) \rVert_2^2}$
+Given a desired end-effector trajectory $\dot {p}^*(t)$ (1) indicating anchor regions in space and (2) how much time to spend in each region, diff-IK finds $\dot q(t)$ solving for joints’ *velocities* instead of *configurations*,
+``` math
+\begin{align}
+\dot q(t) = \arg\min_\nu \; \lVert J(q(t)) \nu - \dot {p}^*(t) \rVert_2^2
+
+\end{align}
+```
 
 Unlike eq. <a href="#ik_problem" data-reference-type="ref" data-reference="ik_problem">[ik_problem]</a>, solving for $\dot q$ is much less dependent on the environment (typically, variations in velocity are constrained by physical limits on the actuators). Conveniently, eq. <a href="#reg_ik_velocity" data-reference-type="ref" data-reference="reg_ik_velocity">[reg_ik_velocity]</a> also often admits the closed-form solution $\dot q = J(q)^+ \dot {p}^*$, where $J^+(q)$ denotes the Moore-Penrose pseudo-inverse of $J(q)$. Finally, discrete-time joint configurations $q$ can be reconstructed from joint velocities $\dot q$ using forward-integration on the continuous-time joint velocity , $q_{t+1} = q_t + \Delta t\,\dot q_t$ for a given $\Delta t$, resulting in tracking via diff-IK.
 
@@ -401,7 +411,7 @@ Despite the last 60+ years of robotics research, autonomous robots are still lar
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="classical-limitations" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="classical-limitations" style="position: absolute;"></span>
 <figcaption>Dynamics-based approaches to robotics suffer from several limitations: (1) orchestrating multiple components poses integration challenges; (2) the need to develop custom processing pipelines for the sensing modalities and tasks considered hinders scalability; (3) simplified analytical models of physical phenomena (here friction at the gripper; credits to @antonovaReinforcementLearningPivoting2017) limit real-world performance. Lastly, (4) dynamics-based methods overlook trends in the availability and growth of robotics data.</figcaption>
 </figure>
 
@@ -438,7 +448,7 @@ TL;DR The need for expensive high-fidelity simulators can be obviated by learnin
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robot-learning-upsides" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robot-learning-upsides" style="position: absolute;"></span>
 <figcaption>Learning-based robotics streamlines perception-to-action by learning a (1) unified high-level controller capable to take (2) high-dimensional, unstructured sensorimotor information. Learning (3) does not require a dynamics model and instead focuses on interaction data, and (4) empirically correlates with the scale of the data used. </figcaption>
 </figure>
 
@@ -454,7 +464,7 @@ Being a field at its relative nascent stages, no prevalent technique(s) proved d
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robot-learning-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robot-learning-atlas" style="position: absolute;"></span>
 <figcaption>Overview of the robot learning methods implemented in <code>lerobot</code>.</figcaption>
 </figure>
 
@@ -470,7 +480,7 @@ Figure <a href="#robot-learning-atlas" data-reference-type="ref" data-reference
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="robotics-with-rl-examples" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="robotics-with-rl-examples" style="position: absolute;"></span>
 <figcaption>Examples of two different robotics tasks performed using RL. In the manipulation task (A) an agent learns to reach for a yellow plastic block in its environment, and to put it inside of a box. In the locomotion task (B) an agent learns to move its center of mass sideways without falling.</figcaption>
 </figure>
 
@@ -488,7 +498,7 @@ The RL framework @suttonReinforcementLearningIntroduction2018, which we briefly
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="rl-most-famous-pic" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="rl-most-famous-pic" style="position: absolute;"></span>
 <figcaption>Agent-Environment interaction diagram (image credits to @suttonReinforcementLearningIntroduction2018).</figcaption>
 </figure>
 
@@ -510,30 +520,35 @@ A length-$T$ *trajectory* is the (random) sequence
 ``` math
 \htmlId{trajectory_definition}{\tau = (s_0, a_0, r_0, s_1, a_1, r_1, \dots, s_{T-1}, a_{T-1}, r_{T-1}, s_T),}
 ```
-with per-step rewards defined as $r_t = r (s_t, a_t, s_{t+1})$ for ease of notation.Interestingly, assuming both the environment dynamics and conditional distribution over actions given states--the *policy*--to be *Markovian*: 
 
-$$
-`\htmlId{dynamics_markovian}{\mathbb P(s_{t+1}\vert s_t, a_t, s_{t-1}, a_{t-1}, \dots s_0, a_0 ) = \mathbb P (s_{t+1}\vert s_t, a_t)\\ \mathbb P(a_t\vert s_t, a_{t-1}, s_{t-1}, s_0, a_0) = \mathbb P(a_t\vert s_t)}`
-$$
+with per-step rewards defined as $r_t = r (s_t, a_t, s_{t+1})$ for ease of notation.Interestingly, assuming both the environment dynamics and conditional distribution over actions given states--the *policy*--to be *Markovian*:
 
- The probability of observing a given trajectory $\tau$ factorizes into
+``` math
+\begin{align}
+\mathbb P(s_{t+1}\vert s_t, a_t, s_{t-1}, a_{t-1}, \dots s_0, a_0 ) &= \mathbb P (s_{t+1}\vert s_t, a_t) \\
+\mathbb P(a_t\vert s_t, a_{t-1}, s_{t-1}, s_0, a_0) &= \mathbb P(a_t\vert s_t) 
+\end{align}
+```
+The probability of observing a given trajectory $\tau$ factorizes into
 ``` math
 \htmlId{traj_prob}{\mathbb P(\tau) = \mathbb P (s_0) \prod_{t=0}^{T-1} \mathbb P (s_{t+1}\vert s_t, a_t)\ \mathbb P(a_t\vert s_t).}
 ```
 
 Policies $\mathbb P(a_t\vert s_t)$ are typically indicated as $\pi(a_t\vert s_t)$, and often parametrized via $\theta$, yielding $\pi_\theta (a_t\vert s_t)$. Policies are trained optimizing the (discounted) *return* associated to a given $\tau$, i.e. the (random) sum of measured rewards over trajectory:
+
 ``` math
 G(\tau) = \sum_{t=0}^{T-1} \gamma^{t} r_t.
 ```
-In that, agents seek to learn control strategies (*policies*, $\pi_\theta$) maximizing the expected return $\mathbb E_{\tau \sim \pi_\theta} G(\tau)$. For a given dynamics $\mathcal D$--i.e., for a given problem--taking the expectation over the (possibly random) trajectories resulting from acting according to a certain policy provides a direct, goal-conditioned ordering in the space of all the possible policies $\Pi$, yielding the (maximization) target $J : \Pi \mapsto \mathbb R$ 
-
-$$
-`\htmlId{RL-j-function}{J(\pi_\theta) = \mathbb E_{\tau \sim \mathbb P_{\theta; \mathcal D}} [G(\tau)],\\ \mathbb P_{\theta; \mathcal D} (\tau) = \rho \prod_{t=0}^{T-1} \mathcal D (s_t, a_t, s_{t+1})\ \pi_\theta (a_t\vert s_t).}`
-$$
-
-
+In that, agents seek to learn control strategies (*policies*, $\pi_\theta$) maximizing the expected return $\mathbb E_{\tau \sim \pi_\theta} G(\tau)$. For a given dynamics $\mathcal D$--i.e., for a given problem--taking the expectation over the (possibly random) trajectories resulting from acting according to a certain policy provides a direct, goal-conditioned ordering in the space of all the possible policies $\Pi$, yielding the (maximization) target $J : \Pi \mapsto \mathbb R$
+``` math
+\begin{align}
+    J(\pi_\theta) &= \mathbb E_{\tau \sim \mathbb P_{\theta; \mathcal D}} [G(\tau)],  \\
+    \mathbb P_{\theta; \mathcal D} (\tau) &= \rho \prod_{t=0}^{T-1} \mathcal D (s_t, a_t, s_{t+1})\ \pi_\theta (a_t\vert s_t).
+\end{align}
+```
 
 Because in the RL framework the agent is assumed to only be able to observe the environment dynamics and not to intervene on them, <a href="#RL-j-function" data-reference-type="ref" data-reference="RL-j-function">[RL-j-function]</a> varies exclusively with the policy followed. In turn, MDPs naturally provide a framework to optimize over the space of the possible behaviors an agent might enact ($\pi \in \Pi$), searching for the *optimal policy* $\pi^* = \arg \max_{\theta} J(\pi_\theta)$, where $\theta$ is the parametrization adopted by the policy set $\Pi: \pi_\theta \in \Pi, \ \forall \theta$. Other than providing a target for policy search, $G(\tau)$ can also be used as a target to discriminate between states and state-action pairs. Given any state $s \in \mathcal S$--e.g., a given configuration of the robot--the *state-value* function
+
 ``` math
 V_\pi(s) = \mathbb E_{\tau \sim \pi} [G(\tau) \big \vert s_0 = s]
 ```
@@ -541,13 +556,17 @@ can be used to discriminate between desirable and undesirable state in terms of
 ``` math
 Q_\pi(s,a) = \mathbb E_{\tau \sim \pi} [G (\tau) \big \vert s_0 = s, a_0=a]
 ```
-Crucially, value functions are interrelated: 
 
-$$
-`\htmlId{q-as-v}{Q_\pi(s_t, a_t) = \mathbb{E}_{s_{t+1}\sim \mathbb P(\bullet \vert s_t, a_t)} [r_t + \gamma V_\pi(s_{t+1})]\\ V_\pi(s_t) = \mathbb E_{a_t\sim \pi(\bullet \vert s_t)} [Q_\pi (s_t, a_t)]}`
-$$
+Crucially, value functions are interrelated:
 
- Inducing an ordering over states and state-action pairs under $\pi$, value functions are central to most RL algorithms. A variety of methods have been developed in RL as standalone attemps to find (approximate) solutions to the problem of maximizing cumulative reward (Figure <a href="#rl-algos-atlas" data-reference-type="ref" data-reference="rl-algos-atlas">[rl-algos-atlas]</a>).
+``` math
+\begin{align}
+Q_\pi(s_t, a_t) &= \mathbb{E}_{s_{t+1}\sim \mathbb P(\bullet \vert s_t, a_t)} [r_t + \gamma V_\pi(s_{t+1})]  \\
+V_\pi(s_t) &= \mathbb E_{a_t\sim \pi(\bullet \vert s_t)} [Q_\pi (s_t, a_t)]
+
+\end{align}
+```
+Inducing an ordering over states and state-action pairs under $\pi$, value functions are central to most RL algorithms. A variety of methods have been developed in RL as standalone attemps to find (approximate) solutions to the problem of maximizing cumulative reward (Figure <a href="#rl-algos-atlas" data-reference-type="ref" data-reference="rl-algos-atlas">[rl-algos-atlas]</a>).
 
 <figure>
 <ResponsiveImage
@@ -557,7 +576,7 @@ $$
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="rl-algos-atlas" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="rl-algos-atlas" style="position: absolute;"></span>
 <figcaption>Popular RL algorithms. See @SpinningUp2018 for a complete list of citations.</figcaption>
 </figure>
 
@@ -579,7 +598,7 @@ Second, learning with a limited number of samples remains problematic in RL, <sp
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="synthetic-vs-real-duck" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="synthetic-vs-real-duck" style="position: absolute;"></span>
 <figcaption>Simulated (left) vs. real-world (right) OpenDuck. Discrepancies in the simulation dynamics (<em>reality gap</em>) pose risks to policy transfer.</figcaption>
 </figure>
 
@@ -593,7 +612,7 @@ Training RL policies in simulation @tobinDomainRandomizationTransferring2017 ad
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ducks-on-terrains" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ducks-on-terrains" style="position: absolute;"></span>
 <figcaption>The same locomotion task can be carried out in different (simulated) domains (exemplified by the difference in terrains) at training time, resulting to increased robustness over diverse environment dynamics.</figcaption>
 </figure>
 
@@ -628,25 +647,39 @@ Q_{i+1}(s_t, a_t) \leftarrow \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t
 ```
 Then, one can derive the (ideally, near-optimal) policy by explicitly maximizing over the action space the final (ideally, near-optimal) estimate $Q_K \approx Q^*$ at each timestep. In fact, under certain assumptions on the MDP considered, $Q_K \to Q^* \, \text{as } K \to \infty$.
 
-Effective in its early applications to small-scale discrete problems and theoretically sound, vanilla Q-learning was found complicated to scale to large $\mathcal S\times \mathcal A$ problems, in which the storing of $Q : \mathcal S\times \mathcal A\mapsto \mathbb R$ alone might result prohibitive. Also, vanilla Q-learning is not directly usable for *continuous*, unstructured state-action space MPDs, such as those considered in robotics. In their seminal work on *Deep Q-Learning* (DQN), @mnihPlayingAtariDeep2013 propose learning Q-values using deep convolutional neural networks, thereby accomodating for large and even unstructured *state* spaces. DQN parametrizes the Q-function using a neural network with parameters $\theta$, updating the parameters by sequentially minimizing the expected squared temporal-difference error (TD-error, $\delta_i$): 
-
-$$
-`\htmlId{dqn-loss}{\mathcal L(\theta_i) = \mathbb E_{(s_t, a_t) \sim \chi(\bullet)} \big[ (\underbrace{y_i - Q_{\theta_i}(s_t, a_t)}_{\delta_i})^2 \big],\\ y_i = \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t, a_t)} \big[ r_t + \gamma \max_{a_t\in \mathcal A} Q_{\theta_{i-1}} (s_{t+1}, a_{t+1}) \big],}`
-$$
-
- Where $\chi$ represents a behavior distribution over state-action pairs. Crucially, $\chi$ can in principle be different from the policy being followed, effectively allowing to reuse prior data stored in a *replay buffer* in the form of $(s_t, a_t, r_t, s_{t+1})$ transitions, used to form the TD-target $y_i$, TD-error $\delta_i$ and loss function <a href="#dqn-loss" data-reference-type="ref" data-reference="dqn-loss">[dqn-loss]</a> via Monte-Carlo (MC) estimates.
+Effective in its early applications to small-scale discrete problems and theoretically sound, vanilla Q-learning was found complicated to scale to large $\mathcal S\times \mathcal A$ problems, in which the storing of $Q : \mathcal S\times \mathcal A\mapsto \mathbb R$ alone might result prohibitive. Also, vanilla Q-learning is not directly usable for *continuous*, unstructured state-action space MPDs, such as those considered in robotics. In their seminal work on *Deep Q-Learning* (DQN), @mnihPlayingAtariDeep2013 propose learning Q-values using deep convolutional neural networks, thereby accomodating for large and even unstructured *state* spaces. DQN parametrizes the Q-function using a neural network with parameters $\theta$, updating the parameters by sequentially minimizing the expected squared temporal-difference error (TD-error, $\delta_i$):
+``` math
+\begin{align}
+\mathcal L(\theta_i) &= \mathbb E_{(s_t, a_t) \sim \chi(\bullet)} 
+    \big[ 
+        (\underbrace{y_i - Q_{\theta_i}(s_t, a_t)}_{\delta_i})^2 
+    \big],  \\
+    y_i &= \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t, a_t)} \big[ r_t + \gamma \max_{a_t\in \mathcal A} Q_{\theta_{i-1}} (s_{t+1}, a_{t+1}) \big], 
+\end{align}
+```
+Where $\chi$ represents a behavior distribution over state-action pairs. Crucially, $\chi$ can in principle be different from the policy being followed, effectively allowing to reuse prior data stored in a *replay buffer* in the form of $(s_t, a_t, r_t, s_{t+1})$ transitions, used to form the TD-target $y_i$, TD-error $\delta_i$ and loss function <a href="#dqn-loss" data-reference-type="ref" data-reference="dqn-loss">[dqn-loss]</a> via Monte-Carlo (MC) estimates.
 
 While effective in handling large, unstructured state spaces for discrete action-space problems, DQN application’s to continous control problems proved challenging. Indeed, in the case of high-capacity function approximators such as neural networks, solving $\max_{a_t \in \mathcal A} Q_\theta(s_t, a_t)$ at each timestep is simply unfeasible due to the (1) continous nature of the action space ($\mathcal A\subset \mathbb R^n$ for some $n$) and (2) impossibility to express the find a cheap (ideally, closed-form) solution to $Q_\theta$.  @silverDeterministicPolicyGradient2014 tackle this fundamental challenge by using a *deterministic* function of the state $s_t$ as policy, $\mu_\phi(s_t) = a_t$, parametrized by $\phi$. Thus, policies can be iteratively refined updating $\phi$ along the direction:
 ``` math
 \htmlId{deterministic-pg}{d_\phi = \mathbb E_{s_t \sim \mathbb P (\bullet)} [\nabla_\phi Q(s_t, a_t)\vert_{a_t = \mu_\phi(s_t)}] = \mathbb E_{s_t \sim \mathbb P(\bullet)} [\nabla_{a_t} Q(s_t, a_t) \vert_{a_t = \mu_\phi(s_t)} \cdot \nabla_\phi \mu(s_t)]}
 ```
+
 Provably, <a href="#deterministic-pg" data-reference-type="ref" data-reference="deterministic-pg">[deterministic-pg]</a> is the *deterministic policy gradient* (DPG) of the policy $\mu_\phi$ @silverDeterministicPolicyGradient2014, so that updates $\phi_{k+1}\leftarrow \phi_k + \alpha d_\phi$ are guaranteed to increase the (deterministic) cumulative discounted reward, $J(\mu_\phi)$.  @lillicrapContinuousControlDeep2019 extended DPG to the case of (1) high-dimensional unstructured observations and (2) continuous action spaces, introducing Deep Deterministic Policy Gradient (DDPG), an important algorithm RL and its applications to robotics. DDPG adopts a modified TD-target compared to the one defined in <a href="#TD-target" data-reference-type="ref" data-reference="TD-target">[TD-target]</a>, by maintaining a policy network used to select actions, yielding
+
 ``` math
 \htmlId{TD-target-ddpg}{y_i = \mathbb E_{s_{t+1} \sim \mathbb P(\bullet \vert s_t, a_t)} \big[ r_t + \gamma Q_{\theta_{i-1}} (s_{t+1}, \mu_\phi(s_{t+1})) \big] .}
 ```
 Similarily to DQN, DDPG also employs the same replay buffer mechanism, to reuse past transitions over training for increased sample efficiency and estimate the loss function via MC-estimates.
 
-Soft Actor-Critic (SAC) @haarnojaSoftActorCriticOffPolicy2018 is a derivation of DDPG in the max-entropy (MaxEnt) RL framework, in which RL agents are tasked with <span class="highlight">maximizing the discounted cumulative reward, while acting as randomly as possible</span>. MaxEnt RL @haarnojaReinforcementLearningDeep2017 has proven particularly robust thanks to the development of diverse behaviors, incentivized by its entropy-regularization formulation. In that, MaxEnt revisits the RL objective $J (\pi)$ to specifically account for the policy entropy, $\htmlId{J-soft}{J(\pi) = \sum_{t=0}^T \mathbb{E}_{(s_t, a_t) \sim \chi} [r_t + \alpha \mathcal H(\pi (\bullet \vert s_t))]}$ This modified objective results in the *soft* TD-target:
+Soft Actor-Critic (SAC) @haarnojaSoftActorCriticOffPolicy2018 is a derivation of DDPG in the max-entropy (MaxEnt) RL framework, in which RL agents are tasked with <span class="highlight">maximizing the discounted cumulative reward, while acting as randomly as possible</span>. MaxEnt RL @haarnojaReinforcementLearningDeep2017 has proven particularly robust thanks to the development of diverse behaviors, incentivized by its entropy-regularization formulation. In that, MaxEnt revisits the RL objective $J (\pi)$ to specifically account for the policy entropy,
+``` math
+\begin{align}
+    J(\pi) &= \sum_{t=0}^T \mathbb{E}_{(s_t, a_t) \sim \chi} [r_t + \alpha \mathcal H(\pi (\bullet \vert s_t))] 
+\end{align}
+```
+
+This modified objective results in the *soft* TD-target:
+
 ``` math
 \htmlId{soft-td-target}{y_i = \mathbb E_{s_{t+1} \sim \mathbb P( \bullet \vert s_t, a_t)} [r_t + \gamma \left( Q_{\theta_{i-1}} (s_{t+1}, a_{t+1}) - \alpha \log \pi_\phi(a_{t+1} \vert s_{t+1}) \right)], \quad a_{t+1} \sim \pi_\phi(\bullet \vert s_t)}
 ```
@@ -676,7 +709,7 @@ Lastly, in order to improve on the robustness of their approach to different goa
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="hil-serl-blocks" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="hil-serl-blocks" style="position: absolute;"></span>
 <figcaption>(A) HIL-SERL allows for real-world training of high performance RL agents by building on top advancements presented by of SAC, RLPD and SERL. (B) Example of human intervention during a HIL-SERL training process on a SO-100.</figcaption>
 </figure>
 
@@ -721,7 +754,7 @@ TL;DR Behavioral Cloning provides a natural platform to learn from real-world in
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-bc-trajectories" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-bc-trajectories" style="position: absolute;"></span>
 <figcaption>(A) Average (with standard deviation) evolution of the actuation levels over the first 5 recorded episodes in <a href="lerobot/svla_so101_pickplace" class="uri">lerobot/svla_so101_pickplace</a>. Proprioperceptive state provide invaluable to determine the robot’s state during an episode. (B) Camera frames are also recorded alongside measurements on the robot’s state, capturing information about the robot’s interaction with its environment.</figcaption>
 </figure>
 
@@ -737,7 +770,7 @@ Formally, let $\mathcal D = \{ \tau^{(i)} \}_{i=1}^N$ be a set of expert traject
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-observation-action-mapping" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-observation-action-mapping" style="position: absolute;"></span>
 <figcaption>Sample observations and action pairs over the course of a given trajectory recorded in <a href="lerobot/svla_so101_pickplace" class="uri">lerobot/svla_so101_pickplace</a>. Observations, comprising of both proprioperceptive and visual information, are recorded alongside the configuration of a second, leader robot controlled by a human expert, providing complete information for regressing actions given observation.</figcaption>
 </figure>
 
@@ -759,7 +792,7 @@ Despite the inherent challenges of learning on non-i.i.d. data, the BC formulati
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-issues-with-bc" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-issues-with-bc" style="position: absolute;"></span>
 <figcaption>Point-wise policies suffer from limitations due to (A) covariate shifts and poor approximation of (B) multimodal demonstrations. (A) Initially small errors may drive the policy out of distribution, incuring in a vicious circle ultimately resulting in failure. (B) Both modes of reaching for a target object in a scene, either left or right-first, are equally as good and thus equally as likely to be present in a dataset of human demonstrations, ultimately resulting in multimodal demonstrations.</figcaption>
 </figure>
 
@@ -779,7 +812,7 @@ Generative Models (GMs) aim to learn the stochastic process underlying the very
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-task-effect-on-pairs" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-task-effect-on-pairs" style="position: absolute;"></span>
 <figcaption>Intuitively, latent variable in a single latent model may contain information regarding the task being performed, which directly results in the likelihood of the same observation-action pair being different for two different tasks. When (A) picking a block the likelihood of a wide gripper’s opening should be higher than narrower one, while it should be the opposite when (B) pushing the block.</figcaption>
 </figure>
 
@@ -797,41 +830,64 @@ Intuitively, in the case of observation-action pairs $(o, a)$ for a robotics app
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-latent-variable-model" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-latent-variable-model" style="position: absolute;"></span>
 <figcaption>(A) The latent variable model in a robotics application regulates influence between observed (<span class="math inline"> <em>o</em>, <em>a</em>)</span> variables and an unobservable latent variable. (B) VAEs approximate exact latent variable models by means of variational inference.</figcaption>
 </figure>
 
-Given a dataset $\mathcal D$ consisting of $N$ i.i.d. observation-action pairs, the log-likelihood of all datapoints under $\theta$ (in Bayesian terms, the *evidence* $p_\theta(\mathcal D)$) can thus be written as: 
-
-$$
-`\htmlId{evidence-definition-1}{\log p_\theta(\mathcal D) = \log \sum_{i=0}^N p_\theta ((o,a)_i)\\ = \log \sum_{i=0}^N \int_{\text{supp}({Z})} p_\theta((o,a)_i \vert z) p(z)\\ = \log \sum_{i=0}^N \int_{\text{supp}({Z})} \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z) p(z)\\ = \log \sum_{i=0}^N \mathbb E_{z \sim p_\theta(\bullet \vert (o,a)_i)} [\frac{p(z)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z)],}`
-$$
-
- where we used <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a> in <a href="#evidence-definition-1" data-reference-type="ref" data-reference="evidence-definition-1">[evidence-definition-1]</a>, multiplied by $1 = \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)}$ in <a href="#evidence-definition-2" data-reference-type="ref" data-reference="evidence-definition-2">[evidence-definition-2]</a>, and used the definition of expected value in <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a>.
+Given a dataset $\mathcal D$ consisting of $N$ i.i.d. observation-action pairs, the log-likelihood of all datapoints under $\theta$ (in Bayesian terms, the *evidence* $p_\theta(\mathcal D)$) can thus be written as:
+``` math
+\begin{align}
+    \log p_\theta(\mathcal D) &= \log \sum_{i=0}^N p_\theta ((o,a)_i) \\
+                              &= \log \sum_{i=0}^N \int_{\text{supp}({Z})} p_\theta((o,a)_i \vert z) p(z) \\
+                              &= \log \sum_{i=0}^N \int_{\text{supp}({Z})} \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z) p(z) \\
+                              &= \log \sum_{i=0}^N \mathbb E_{z \sim p_\theta(\bullet \vert (o,a)_i)} [\frac{p(z)}{q_\theta(z \vert (o,a)_i)} \cdot p_\theta((o,a)_i \vert z)], 
+\end{align}
+```
+where we used <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a> in <a href="#evidence-definition-1" data-reference-type="ref" data-reference="evidence-definition-1">[evidence-definition-1]</a>, multiplied by $1 = \frac{q_\theta(z \vert (o,a)_i)}{q_\theta(z \vert (o,a)_i)}$ in <a href="#evidence-definition-2" data-reference-type="ref" data-reference="evidence-definition-2">[evidence-definition-2]</a>, and used the definition of expected value in <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a>.
 
 In the special case where one assumes distributions to be tractable, $p_\theta (\mathcal D)$ is typically tractable too, and $\max_\theta \log p_\theta(\mathcal D)$ provides a natural target for (point-wise) infering the unknown parameters $\theta$ of the generative model. Unfortunately, <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> is rarely tractable when the distribution $p$ is modeled with approximators such as neural networks, especially for high-dimensional, unstructured data.
 
 In their seminal work on Variational Auto-Encoders (VAEs), @kingmaAutoEncodingVariationalBayes2022 present two major contributions to learn complex latent-variable GMs on unstructured data, proposing (1) a tractable, variational lower-bound to <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> as an optimization target to jointly learn likelihood and posterior and (2) high-capacity function approximators to model the likelihood $p_\theta(o,a\vert z)$ and (approximate) posterior distribution $q_\phi(z \vert o,a) \approx q_\theta(z \vert o,a)$.
 
-In particular, the lower bound on <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> (Evidence LOwer Bound, *ELBO*) can be derived from <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> applying Jensen’s inequality--$\log \mathbb{E}[\bullet] \geq \mathbb{E} [\log (\bullet)]$--yielding: 
+In particular, the lower bound on <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> (Evidence LOwer Bound, *ELBO*) can be derived from <a href="#evidence-definition" data-reference-type="ref" data-reference="evidence-definition">[evidence-definition]</a> applying Jensen’s inequality--$\log \mathbb{E}[\bullet] \geq \mathbb{E} [\log (\bullet)]$--yielding:
+``` math
+\begin{align}
+    \log p_\theta(\mathcal D) &\geq \sum_{i=0}^{N} \left(
+            \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big]
+            + \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} [\log \left( \frac{p(z)}{q_\theta(z \vert (o,a)_i)} \right)]
+        \right) \\
+        &= \sum_{i=0}^{N} \left(
+            \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big]
+        - \text{D}_{\text{KL}}\big[ q_\theta(z \vert (o,a)_i) \Vert p(z) \big]
+        \right) 
+\end{align}
+```
 
-$$
-`\htmlId{ELBO-intractable}{\log p_\theta(\mathcal D) \geq \sum_{i=0}^{N} \left( \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big] + \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} [\log \left( \frac{p(z)}{q_\theta(z \vert (o,a)_i)} \right)] \right)\\ = \sum_{i=0}^{N} \left( \mathbb{E}_{z \sim p_\theta(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big] - \text{D}_{\text{KL}}\big[ q_\theta(z \vert (o,a)_i) \Vert p(z) \big] \right)}`
-$$
+The true, generally intractable posterior $p_\theta (z \vert o,a)$ prevents computing both the expectation and KL divergence terms in <a href="#ELBO-intractable" data-reference-type="ref" data-reference="ELBO-intractable">[ELBO-intractable]</a>, and therefore @kingmaAutoEncodingVariationalBayes2022 propose deriving the ELBO using an *approximate* posterior $q_\phi(z \vert o,a)$, resulting in the final, tractable ELBO objective,
 
- The true, generally intractable posterior $p_\theta (z \vert o,a)$ prevents computing both the expectation and KL divergence terms in <a href="#ELBO-intractable" data-reference-type="ref" data-reference="ELBO-intractable">[ELBO-intractable]</a>, and therefore @kingmaAutoEncodingVariationalBayes2022 propose deriving the ELBO using an *approximate* posterior $q_\phi(z \vert o,a)$, resulting in the final, tractable ELBO objective, $\htmlId{ELBO}{\text{ELBO}_{\mathcal D}(\theta, \phi) = \sum_{i=0}^{N} \left( \mathbb{E}_{z \sim q_\phi(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big] - \text{D}_{\text{KL}}\big[ q_\phi(z \vert (o,a)_i) \Vert p(z) \big] \right)}$ From Jensen’s inequality, maximizing ELBO results in maximizing the log-likelihood of the data too, thus providing a natural, tractable optimization target. Indeed, expectations can be estimated using MC estimates from the learned distributions in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, while the KL-divergence term can typically be computed in closed-form (1) modeling $q_\phi$ as a Gaussian $q_\phi(z \vert o,a) = \mathcal N\big(\mu_\phi(o,a), \Sigma_\phi(o,a) \big)$ and (2) imposing a standard Gaussian prior on the latent space, $p(z) = \mathcal N(\mathbf{0}, \mathbf{I})$.
+``` math
+\begin{align}
+\text{ELBO}_{\mathcal D}(\theta, \phi) = \sum_{i=0}^{N} \left(
+            \mathbb{E}_{z \sim q_\phi(\cdot \vert (o,a)_i)} \big[ \log p_\theta((o,a)_i \vert z) \big]
+        - \text{D}_{\text{KL}}\big[ q_\phi(z \vert (o,a)_i) \Vert p(z) \big]
+        \right)
+        
+\end{align}
+```
+From Jensen’s inequality, maximizing ELBO results in maximizing the log-likelihood of the data too, thus providing a natural, tractable optimization target. Indeed, expectations can be estimated using MC estimates from the learned distributions in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, while the KL-divergence term can typically be computed in closed-form (1) modeling $q_\phi$ as a Gaussian $q_\phi(z \vert o,a) = \mathcal N\big(\mu_\phi(o,a), \Sigma_\phi(o,a) \big)$ and (2) imposing a standard Gaussian prior on the latent space, $p(z) = \mathcal N(\mathbf{0}, \mathbf{I})$.
 
 An intuitive explanation of the learning dynamics of VAEs can be given considering the equivalent case of *minimizing the negative ELBO*, which admits a particularly interpretable factorization
 
-
-
-$$
-`\htmlId{VAE-min-neg-ELBO}{\min_{\theta, \phi} - \text{ELBO}_{\mathcal (o,a) \sim \mathcal D}(\theta, \phi) = \min_{\theta, \phi}\mathbf{L^{\text{rec}}}(\theta) + \mathbf{L^{\text{reg}}}(\phi)\\ \mathbf{L^{\text{rec}}}(\theta) = \mathbb{E}_{z \sim q_\phi(\cdot \vert o,a} \big[ \log p_\theta(o,a \vert z) \big]\\ \mathbf{L^{\text{reg}}}(\phi) = \text{D}_{\text{KL}}\big[ q_\phi(z \vert o,a) \Vert p(z) \big]}`
-$$
-
-
+``` math
+\begin{align}
+\min_{\theta, \phi} - \text{ELBO}_{\mathcal (o,a) \sim \mathcal D}(\theta, \phi) &= \min_{\theta, \phi}\mathbf{L^{\text{rec}}}(\theta) + \mathbf{L^{\text{reg}}}(\phi) \\
+\mathbf{L^{\text{rec}}}(\theta) &= \mathbb{E}_{z \sim q_\phi(\cdot \vert o,a} \big[ \log p_\theta(o,a \vert z) \big]  \\
+\mathbf{L^{\text{reg}}}(\phi) &= \text{D}_{\text{KL}}\big[ q_\phi(z \vert o,a) \Vert p(z) \big] 
+\end{align}
+```
 
 For any given $(o,a)$ pair, the expected value term of <a href="#VAE-Lrec" data-reference-type="ref" data-reference="VAE-Lrec">[VAE-Lrec]</a> is typically computed via MC estimates, resulting in
+
 ``` math
 -\mathbb{E}_{z \sim q_\phi(\bullet \vert o,a)} \big[ \log p_\theta(o,a \vert z) \big] = \mathbf{L^{\text{rec}}} \approx - \frac{1}{n} \sum_{i=0}^n \log p_\theta(o,a \vert z_i).
 ```
@@ -843,13 +899,14 @@ Indeed, it is very common in practice to approximate from the learned likelihood
 
 #### Diffusion Models
 
-VAEs approximate probability distributions via a *single* latent variable model, assuming the underlying unknown distribution can be factored according to <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a>, and solve the variational inference problem of jointly learning the likelihood $p_\theta$ and (approximate) posterior $q_\phi$ for such model. In that, the unknown data distribution $p(o,a)$ is effectively approximated via $\int_Z p(z) p_\theta(o,a \vert z)$, and the underlying generative process reproduced by (1) sampling a latent variable and (2) learning to decode it into a (ideally) high-likelihood sample under the (unknown) $p(o,a)$. Diffusion Models (DMs) @hoDenoisingDiffusionProbabilistic2020 are another class of GMs which treat the similar problem of approximating an underlying unknown data distribution--*variational inference*--by *partially* extending VAEs to the case where *multiple* latent variables influence each other and the generative process underlying $o,a$ itself. In particular, DMs posit the generative process can be decomposed to a series of piece-wise (Markovian) interactions between (latent) variables (Figure <a href="#ch4-many-latents" data-reference-type="ref" data-reference="ch4-many-latents">[ch4-many-latents]</a>), resulting in 
-
-$$
-`\htmlId{BC-multi-latent-model-1}{p(\underbrace{o,a}_{= z_0}) = \int_{\text{supp}({Z_0})} \int_{\text{supp}({Z_1})} \ldots \int_{\text{supp}({Z_T})} p(z_0, z_1, \dots z_T)\\ p(z_0, z_1, \dots z_T) = p(z_T) \prod_{t=0}^{T} p(z_{t-1} \vert z_t),}`
-$$
-
- where we explicitly showed the marginalization over the multiple latents in <a href="#BC-multi-latent-model-1" data-reference-type="ref" data-reference="BC-multi-latent-model-1">[BC-multi-latent-model-1]</a>, and used the law of conditional probability and Markov property in <a href="#BC-multi-latent-model-2" data-reference-type="ref" data-reference="BC-multi-latent-model-2">[BC-multi-latent-model-2]</a>.
+VAEs approximate probability distributions via a *single* latent variable model, assuming the underlying unknown distribution can be factored according to <a href="#BC-latent-variable" data-reference-type="ref" data-reference="BC-latent-variable">[BC-latent-variable]</a>, and solve the variational inference problem of jointly learning the likelihood $p_\theta$ and (approximate) posterior $q_\phi$ for such model. In that, the unknown data distribution $p(o,a)$ is effectively approximated via $\int_Z p(z) p_\theta(o,a \vert z)$, and the underlying generative process reproduced by (1) sampling a latent variable and (2) learning to decode it into a (ideally) high-likelihood sample under the (unknown) $p(o,a)$. Diffusion Models (DMs) @hoDenoisingDiffusionProbabilistic2020 are another class of GMs which treat the similar problem of approximating an underlying unknown data distribution--*variational inference*--by *partially* extending VAEs to the case where *multiple* latent variables influence each other and the generative process underlying $o,a$ itself. In particular, DMs posit the generative process can be decomposed to a series of piece-wise (Markovian) interactions between (latent) variables (Figure <a href="#ch4-many-latents" data-reference-type="ref" data-reference="ch4-many-latents">[ch4-many-latents]</a>), resulting in
+``` math
+\begin{align}
+    p(\underbrace{o,a}_{= z_0}) &= \int_{\text{supp}({Z_0})} \int_{\text{supp}({Z_1})} \ldots \int_{\text{supp}({Z_T})} p(z_0, z_1, \dots z_T)  \\ 
+    p(z_0, z_1, \dots z_T) &= p(z_T) \prod_{t=0}^{T} p(z_{t-1} \vert z_t), 
+\end{align}
+```
+where we explicitly showed the marginalization over the multiple latents in <a href="#BC-multi-latent-model-1" data-reference-type="ref" data-reference="BC-multi-latent-model-1">[BC-multi-latent-model-1]</a>, and used the law of conditional probability and Markov property in <a href="#BC-multi-latent-model-2" data-reference-type="ref" data-reference="BC-multi-latent-model-2">[BC-multi-latent-model-2]</a>.
 
 <figure>
 <ResponsiveImage
@@ -859,7 +916,7 @@ $$
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-many-latents" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-many-latents" style="position: absolute;"></span>
 <figcaption>HMLV models posit the data generation process is influenced by a stack of Markov-dependent latent variables, with samples from the posterior distribution being progressively higher up in the hierarchy.</figcaption>
 </figure>
 
@@ -867,13 +924,16 @@ Similarily to VAEs, providing an exact interpretation for the latent variables i
 
 Just like VAEs, DMs attemp to learn to reproduce an underlying data distribution $p (o,a)$ given a collection of i.i.d. samples approximating the model posited to have generated the data in the first place ( <a href="#BC-multi-latent-model-1" data-reference-type="ref" data-reference="BC-multi-latent-model-1">[BC-multi-latent-model-1]</a>). Similarily to VAEs, DMs approximate the process of sampling from the unknown $p(o,a)$ (1) sampling from an easy-to-sample distribution (e.g., Gaussian) and (2) learning to reconstruct high-likelihood samples under the unknown distribution. However, in stark contrast with VAEs, the easy-to-sample distribution contains *no mutual information* regarding the data distribution $p(o,a)$. Crucially, as no information from the sample $(o,a)$ (denoted as $z_0 \equiv (o,a)$ for the sake of notation) is assumed to be propagated throughout the chain of latents, the posterior $q(z_t \vert z_{t-1})$ assumes a relatively amicable structure in DMs, reducing complexity. The *true* likelihood $p(z_{t-1} \vert z_t)$ is instead typically approximated using the parametrization $p_\theta (z_{t-1} \vert z_t)$. In that, the information contained in the unknwon data distribution is *reconstructed* via a process in which samples from a fixed distribution are turned into (ideally) high-likelihood samples under $p(o,a)$--a process referred to as *denoising*.
 
-Under such model, we can express the log-likelihood of an arbitrary sample as[^4] 
-
-$$
-`\htmlId{diffusion-likelihood}{\log p_\theta (\underbrace{o,a}_{= z_0}) = \mathbb{E}_{z_1 \sim q(\bullet \vert z_0)} \log p_\theta (z_0 \vert z_1) -\\ \mathbb{E}_{z_{T-1} \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_T \vert z_{T-1}) \Vert p(z_T) ) \big] - \notag\\ \sum_{t=1}^{T-1} \mathbb{E}_{(z_{t-1}, z_{t+1}) \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_t \vert z_{t-1}) \Vert p_\theta(z_t \vert z_{t-1}) ) \big], \notag}`
-$$
-
- providing an optimization target in the form of $\max_\theta \log p_\theta (\mathcal D)$.
+Under such model, we can express the log-likelihood of an arbitrary sample as[^4]
+``` math
+\begin{align}
+    \log p_\theta (\underbrace{o,a}_{= z_0}) = 
+    &\mathbb{E}_{z_1 \sim q(\bullet \vert z_0)} \log p_\theta (z_0 \vert z_1) -  \\
+    &\mathbb{E}_{z_{T-1} \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_T \vert z_{T-1}) \Vert p(z_T) ) \big] - \notag \\ 
+    &\sum_{t=1}^{T-1} \mathbb{E}_{(z_{t-1}, z_{t+1}) \sim q(\bullet \vert z_0)} \big[ \text{D}_{\text{KL}}(q(z_t \vert z_{t-1}) \Vert p_\theta(z_t \vert z_{t-1}) ) \big], \notag
+\end{align}
+```
+providing an optimization target in the form of $\max_\theta \log p_\theta (\mathcal D)$.
 
 In their seminal work on using DMs for variational inference, @hoDenoisingDiffusionProbabilistic2020 introduce major contributions regarding solving $\min_\theta -\log p_\theta(o,a)$. In particular, @hoDenoisingDiffusionProbabilistic2020 exclusively adopt a fixed *Gaussian* posterior in the form of $q(z_t \vert z_{t-1}) = \mathcal{N}(\sqrt{1-\beta_t}z_{t-1}, \beta_t \mathbf I)$. The choice of adopting Gaussians has profound implications on the generative process modeled. Indeed, under the (mild) assumption that the variance is sufficiently small $\beta_t \leq \eta, \eta \in \mathbb R^+$, @sohl-dicksteinDeepUnsupervisedLearning2015 proved that the likelihood $p(z_{t-1} \vert z_t)$ is Gaussian as well, which allows for the particularly convenient parametrization of the approximate likelihood $p_\theta (x_{t-1} \vert x_t) = \mathcal N(\mu_\theta(x_t, t), \Sigma_\theta(x_t,t)), \ t \in [1,T]$, as well as for closed-form tractability of the KL-divergence terms in <a href="#diffusion-likelihood" data-reference-type="ref" data-reference="diffusion-likelihood">[diffusion-likelihood]</a>. Further, the posterior’s structure also enables an analytical description for the distribution of the $t$-th latent variable, $q(z_t \vert z_0) = \mathcal N (\sqrt{\bar{\alpha}_t}z_0, (1-\bar{\alpha}_t) \mathbf{I})$, with $\alpha_t = 1-\beta_t, \ \bar \alpha_t = \prod_{k=1}^t \alpha_k$, which conveniently prevents iterative posterior sampling.
 
@@ -885,7 +945,7 @@ In their seminal work on using DMs for variational inference, @hoDenoisingDiffu
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="diffusion-robot-actions" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="diffusion-robot-actions" style="position: absolute;"></span>
 <figcaption>DMs iteratively corrupt samples (left) from an unknown distribution into a quasi-standard Gaussian (center), learning the displacement field (right) that permits to reconstruct samples from the unknown target distribution by iteratively denoising samples of a tractable, easy-to-sample distribution.</figcaption>
 </figure>
 
@@ -899,29 +959,45 @@ Finally, adopting Gaussian posteriors permits a particularly pleasing interpreta
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-action-vs-observation-distribution" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-action-vs-observation-distribution" style="position: absolute;"></span>
 <figcaption>A joint action-observation distribution, in the simplified case where the observation is the elbow-flex actuation in a SO-100, and the action is the recorded position for the same joint in the teleoperator arm. The motion recorded being teleoperated, the points distribute along a the diagonal.</figcaption>
 </figure>
 
-Because the recorded behavior is teleoperated, measurements mostly distribute along the line $a = o + \eta, \eta \sim N(0,1)$, with $\eta$-variability accouting for minor control inconsistencies (Figure <a href="#ch4-action-vs-observation-distribution" data-reference-type="ref" data-reference="ch4-action-vs-observation-distribution">[ch4-action-vs-observation-distribution]</a>). Using Gaussian posteriors--i.e., adding Gaussian noise--effectively simulates a *Brownian motion* for the elements in the distribution’s support (in Figure <a href="#diffusion-robot-actions" data-reference-type="ref" data-reference="diffusion-robot-actions">[diffusion-robot-actions]</a>, $\mathcal O\times \mathcal A$), whereby information *diffuses away* from the samples, and comparing the diffused samples to the original data points one can derive an estimate of the total displacement induced by diffusion. Under the only assumption that the likelihood of the diffused samples is low under the original unknown data distribution, then one can effectively approximate the unkwown distribution by learning to *reverse* such displacement. This key intuition allows to write a simplified training objective: $\htmlId{diffusion-simplified-loss}{\mathcal L(\theta) = \mathbb{E}_{t, z_0, \epsilon} \big[ \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} z_0 + \epsilon \sqrt{1 - \bar \alpha_t}, t) \Vert^2 \big], \quad t \sim \mathcal{U}(\{1,\dots,T\}), \quad z_0 \sim \mathcal{D}, \quad \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}).}$
+Because the recorded behavior is teleoperated, measurements mostly distribute along the line $a = o + \eta, \eta \sim N(0,1)$, with $\eta$-variability accouting for minor control inconsistencies (Figure <a href="#ch4-action-vs-observation-distribution" data-reference-type="ref" data-reference="ch4-action-vs-observation-distribution">[ch4-action-vs-observation-distribution]</a>). Using Gaussian posteriors--i.e., adding Gaussian noise--effectively simulates a *Brownian motion* for the elements in the distribution’s support (in Figure <a href="#diffusion-robot-actions" data-reference-type="ref" data-reference="diffusion-robot-actions">[diffusion-robot-actions]</a>, $\mathcal O\times \mathcal A$), whereby information *diffuses away* from the samples, and comparing the diffused samples to the original data points one can derive an estimate of the total displacement induced by diffusion. Under the only assumption that the likelihood of the diffused samples is low under the original unknown data distribution, then one can effectively approximate the unkwown distribution by learning to *reverse* such displacement. This key intuition allows to write a simplified training objective:
+``` math
+\begin{align}
+
+    \mathcal L(\theta) = \mathbb{E}_{t, z_0, \epsilon} \big[
+        \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} z_0 + \epsilon \sqrt{1 - \bar \alpha_t}, t) \Vert^2 \big], \quad t \sim \mathcal{U}(\{1,\dots,T\}), \quad
+        z_0 \sim \mathcal{D}, \quad
+        \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}).
+\end{align}
+```
 
 In this simplified (minimization) objective, the optimization process differs from <a href="#diffusion-likelihood" data-reference-type="ref" data-reference="diffusion-likelihood">[diffusion-likelihood]</a> in that, rather than maxizing $p_\theta$ directly, the parameters $\theta$ of the pairwise likelihood $p_\theta(z_{t-1} \vert z_t)$ are adjusted to *predict the total displacement* $\epsilon$ for a randomly long ($t \sim \mathcal{U}(\{1,\dots,T\}$ )) diffusion process starting from a sample of the target distribution.
 
-By learning the total displacement from a generally, uninformative corrupted sample obtained diffusing information and a sample from an unknown distribution--significant ($\Vert \epsilon \Vert > 0$) whenever input and target distribution are sufficiently different-- @hoDenoisingDiffusionProbabilistic2020 show that one can approximate the underlying distribution reversing the displacement, *denoising* samples. Interestingly, under the hypothesis real-world data belongs to a single higher dimensional manifold (Manifold Hypothesis), @permenterInterpretingImprovingDiffusion2024 show that diffusion learns the gradient of a distance function from any off-point manifold (such as perturbed, uniformative samples), and the data manifold itself. Following this gradient--i.e., denoising a sample from an uninformative distribution--corresponds to projecting back into the manifold, yielding a procedure to sample from unknown distributions by means of Euclidean projection. Indeed, under the assumption that $p_\theta (z_{t-1} \vert z_t)$ is Gaussian, then sampling $z_{t-1} \sim p_\theta(\bullet \vert z_{t})$ corresponds to computing $\htmlId{diffusion-denoising-definition}{z_{t-1} = \frac{1}{\sqrt{\alpha_t}} \left( z_t - \frac{\beta_t}{\sqrt{1 - \bar\alpha_t}} \epsilon_\theta(z_t, t) \right) + \sigma_t \epsilon, \quad \epsilon \sim \mathcal N(\mathbf{0}, \mathbf{I}),}$ thus showing that the lower-level latent variables in a DM can be obtained by iteratively removing noise from the one-step higher order variable, using the noise regressor $\epsilon_\theta(z_t, t)$ learned minimizing <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>.
+By learning the total displacement from a generally, uninformative corrupted sample obtained diffusing information and a sample from an unknown distribution--significant ($\Vert \epsilon \Vert > 0$) whenever input and target distribution are sufficiently different-- @hoDenoisingDiffusionProbabilistic2020 show that one can approximate the underlying distribution reversing the displacement, *denoising* samples. Interestingly, under the hypothesis real-world data belongs to a single higher dimensional manifold (Manifold Hypothesis), @permenterInterpretingImprovingDiffusion2024 show that diffusion learns the gradient of a distance function from any off-point manifold (such as perturbed, uniformative samples), and the data manifold itself. Following this gradient--i.e., denoising a sample from an uninformative distribution--corresponds to projecting back into the manifold, yielding a procedure to sample from unknown distributions by means of Euclidean projection. Indeed, under the assumption that $p_\theta (z_{t-1} \vert z_t)$ is Gaussian, then sampling $z_{t-1} \sim p_\theta(\bullet \vert z_{t})$ corresponds to computing
+``` math
+\begin{align}
+    z_{t-1} = \frac{1}{\sqrt{\alpha_t}} \left( z_t - \frac{\beta_t}{\sqrt{1 - \bar\alpha_t}} \epsilon_\theta(z_t, t) \right) + \sigma_t \epsilon, \quad \epsilon \sim \mathcal N(\mathbf{0}, \mathbf{I}), 
+\end{align}
+```
+thus showing that the lower-level latent variables in a DM can be obtained by iteratively removing noise from the one-step higher order variable, using the noise regressor $\epsilon_\theta(z_t, t)$ learned minimizing <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>.
 
 #### Flow Matching
 
 <span id="ch4-flow-matching" style="position: absolute;"></span>
 
-The posterior parametrization adopted by DMs proved traditionally effective, yet it raised concerns circa its efficiency at inference time, where a possibly large of compute-expensive denoising steps are needed in order to recover a sample from the target distribution. Flow Matching (FM) @lipmanFlowMatchingGenerative2023 extends DMs to the general case of arbitrary, parametrized likelihood and posteriors, and in this defines a superseding class of GMs providing a unified framework for learning *continuous transformations* between distributions, encompassing and generalizing DMs. Instead of a *stochastic, discrete, multi-step* denoising process, FM aims to learn a *deterministic, continuous, differentiable flow* $\psi [0,1] \times Z \mapsto Z$, formalized starting from possibly time-dependent vector field $v: [0,1] \times Z \mapsto Z$ transporting samples from a simple prior distribution $p_0$--e.g., a standard Gaussian--to a more complex, potentially unknown data distribution $p_1$ over time. Note how FM models time $t \in [0,1]$ to be varying continuously while moving away *from* an easy-to-sample distribution $p_0$ *towards* the unknown data-distribution, $p_1$. This results in a continuous and deterministic trajectory for each sample, which can be more efficient to generate compared to the stochastic paths of DMs. Formally, FM can be fully characterized by an ordinary differential equation (ODE) relating instantaneous variations of flows with the underlying vector field, and hence providing complete trajectories over the distributions’ support when integrating over time, 
-
-$$
-`\frac{d}{dt} \psi(z, t) = v(t, \psi(t, z))\\ \psi(0, z) = z`
-$$
-
-
+The posterior parametrization adopted by DMs proved traditionally effective, yet it raised concerns circa its efficiency at inference time, where a possibly large of compute-expensive denoising steps are needed in order to recover a sample from the target distribution. Flow Matching (FM) @lipmanFlowMatchingGenerative2023 extends DMs to the general case of arbitrary, parametrized likelihood and posteriors, and in this defines a superseding class of GMs providing a unified framework for learning *continuous transformations* between distributions, encompassing and generalizing DMs. Instead of a *stochastic, discrete, multi-step* denoising process, FM aims to learn a *deterministic, continuous, differentiable flow* $\psi [0,1] \times Z \mapsto Z$, formalized starting from possibly time-dependent vector field $v: [0,1] \times Z \mapsto Z$ transporting samples from a simple prior distribution $p_0$--e.g., a standard Gaussian--to a more complex, potentially unknown data distribution $p_1$ over time. Note how FM models time $t \in [0,1]$ to be varying continuously while moving away *from* an easy-to-sample distribution $p_0$ *towards* the unknown data-distribution, $p_1$. This results in a continuous and deterministic trajectory for each sample, which can be more efficient to generate compared to the stochastic paths of DMs. Formally, FM can be fully characterized by an ordinary differential equation (ODE) relating instantaneous variations of flows with the underlying vector field, and hence providing complete trajectories over the distributions’ support when integrating over time,
+``` math
+\begin{align}
+    \frac{d}{dt} \psi(z, t) &= v(t, \psi(t, z)) \\
+    \psi(0, z) &= z
+\end{align}
+```
 
 FM proved very effective in a variety of applications, ranging from image @esserScalingRectifiedFlow2024 and video generation @polyakMovieGenCast2025 to robotics control @blackp0VisionLanguageActionFlow2024. Most notably, in their introductory work on FM for GM, @lipmanFlowMatchingGenerative2023 show how DMs can be seen as a specific instance of FM where the *conditional* target vector field $u$ approximated by the noise regressor corresponds to
+
 ``` math
 \htmlId{fm-diffusion-vector-field}{u(t, z\vert z_0) = \frac{\frac{d}{dt}\alpha(1-t)}{1 - (\alpha(1-t))^2}(\alpha(1-t)z - z_0), \quad \alpha(t) = e^{-\frac12 \int_0^t \beta(s) ds}, \quad \forall z_0 \in \mathcal D}
 ```
@@ -935,7 +1011,7 @@ Note that the traditional discrete-time noise-scheduler ${\beta_t}_{t=0}^T$ is n
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-normalizing-flows" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-normalizing-flows" style="position: absolute;"></span>
 <figcaption>Probability distributions can be modified applying vector fields resulting in a flow of mass in the support. When acting over time, vector fields can effectively change the distribution’s structure.</figcaption>
 </figure>
 
@@ -949,11 +1025,19 @@ While the noising schedule of DMs results in a stochastic process that resembles
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-diffusion-paths-versus-fm" style="position- absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-diffusion-paths-versus-fm" style="position: absolute;"></span>
 <figcaption>Compared to diffusion, flow matching distorts distribution along a less randomic pattern, resulting in a clearer interpolation between source and target distribution. The visualization shows an example comparison between these two methods on joint distribution of robot observations and actions over <span class="math inline"> <em>T</em> = 50</span> steps.</figcaption>
 </figure>
 
-In practice, FM can be applied to generative modeling by learning a vector field regressor $v_\theta(z, t)$ to approximate a given target vector field $u(t, z)$. In the particular case of DMs, $u(t, z)$ is defined as in <a href="#fm-diffusion-vector-field" data-reference-type="ref" data-reference="fm-diffusion-vector-field">[fm-diffusion-vector-field]</a>, while in priciple the target vector field can be learned to induce a particular transportation, or fixed according to OT. Given a sample from the data distribution $z_1 \sim p_1$ and a sample from an easy-to-sample prior $z_0 \sim p_0$, CFM defines a simple path between them using *linear interpolation* between samples $z_t = (1-t)z_0 + t z_1$, resulting in the target vector field $u(t, z_t) = z_1 - z_0$. Then, a FM model can be trained with the simple regression objective defined as $\htmlId{flow-matching-objective}{\mathcal L(\theta) = \mathbb{E}_{t, z_0, z_1} \big[ \Vert v_\theta((1-t)z_0 + t z_1, t) - (z_1 - z_0) \Vert^2 \big], \quad t \sim \mathcal{U}([0,1]),}$ where $z_0 \sim p_0(\bullet)$ and $z_1 \sim p_1(\bullet)$. Note how in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a>--differently from <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>--time is assumed to be varying continuously $t \sim \mathcal U([0,1])$ rather than discretely $t \sim \mathcal U(\{0,1\})$, a key property of flow-based models. The objective in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a> directly regresses the learned vector field onto the simple, straight path connecting a point from the prior and a point from the data, providing a simulation-free training procedure that is both stable and efficient. At inference time, samples are generated by starting with $z_0 \sim p_0$ and iteratively refined according to $\frac{dz}{dt} = v_\theta(z_t, t)$ for $t \in [0,1]$--an operation that can be numerically carried out with standard ODE solvers.
+In practice, FM can be applied to generative modeling by learning a vector field regressor $v_\theta(z, t)$ to approximate a given target vector field $u(t, z)$. In the particular case of DMs, $u(t, z)$ is defined as in <a href="#fm-diffusion-vector-field" data-reference-type="ref" data-reference="fm-diffusion-vector-field">[fm-diffusion-vector-field]</a>, while in priciple the target vector field can be learned to induce a particular transportation, or fixed according to OT. Given a sample from the data distribution $z_1 \sim p_1$ and a sample from an easy-to-sample prior $z_0 \sim p_0$, CFM defines a simple path between them using *linear interpolation* between samples $z_t = (1-t)z_0 + t z_1$, resulting in the target vector field $u(t, z_t) = z_1 - z_0$. Then, a FM model can be trained with the simple regression objective defined as
+``` math
+\begin{align}
+
+    \mathcal L(\theta) = \mathbb{E}_{t, z_0, z_1} \big[
+        \Vert v_\theta((1-t)z_0 + t z_1, t) - (z_1 - z_0) \Vert^2 \big], \quad t \sim \mathcal{U}([0,1]),
+\end{align}
+```
+where $z_0 \sim p_0(\bullet)$ and $z_1 \sim p_1(\bullet)$. Note how in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a>--differently from <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a>--time is assumed to be varying continuously $t \sim \mathcal U([0,1])$ rather than discretely $t \sim \mathcal U(\{0,1\})$, a key property of flow-based models. The objective in <a href="#flow-matching-objective" data-reference-type="ref" data-reference="flow-matching-objective">[flow-matching-objective]</a> directly regresses the learned vector field onto the simple, straight path connecting a point from the prior and a point from the data, providing a simulation-free training procedure that is both stable and efficient. At inference time, samples are generated by starting with $z_0 \sim p_0$ and iteratively refined according to $\frac{dz}{dt} = v_\theta(z_t, t)$ for $t \in [0,1]$--an operation that can be numerically carried out with standard ODE solvers.
 
 ### Action Chunking with Transformers
 
@@ -961,7 +1045,17 @@ While GMs prove useful in learning complex, high-dimensional multi-modal distrib
 
 On the robot learning side of their contributions, @zhaoLearningFineGrainedBimanual2023 adopt transformers as the architectural backbone to learn a *Conditional* VAE @sohnLearningStructuredOutput2015. Conditional VAEs are a variation of the more standard VAE formulation introducing a conditioning variable on sampling from the latent prior, allowing the modeling of *one-to-many* relationships between latent and data samples. Further, in stark contrast with previous work @florenceImplicitBehavioralCloning2022, @jannerPlanningDiffusionFlexible2022, @zhaoLearningFineGrainedBimanual2023 do not learn a full joint $p_\theta(o,a)$ on observation and actions. While the *policy* distribution $p_\theta(a \vert o)$ can in principle be entirely described from its joint $p_\theta(o,a)$, it is often the case that the conditional distribution is intractable when using function approximators, as $p_\theta(a \vert o) = \tfrac{p_\theta(o,a)}{\int_\mathcal Ap_\theta(o,a)}$ and the integral in the denominator is typically intractable. Instead of modeling the full joint using a vanilla VAE, @zhaoLearningFineGrainedBimanual2023 propose learning a *conditional* VAE @sohnLearningStructuredOutput2015 modeling the policy distribution directly $p (a \vert o)$.
 
-In practice, when learning from demonstrations adopting CVAEs results in a slight modification to the VAE objective in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, which is adapted to $\htmlId{c-ELBO}{\text{ELBO}_{\mathcal D}(\theta, \phi, \omega) = \sum_{i=0}^{N} \left( \mathbb{E}_{z \sim q_\phi(\cdot \vert o_i, a_i)} \big[ \log p_\theta(a_i \vert z, o_i) \big] - \text{D}_{\text{KL}}\big[ q_\phi(z \vert o_i, a_i) \Vert p_\omega(z \vert o_i) \big] \right)}$ Notice how in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> we are now also learning a new set of parameters $\omega$ for the prior distribution in the latent space. Effectively, this enables conditioning latent-space sampling (and thus reconstruction) during training, and potentially inference, providing useful when learning inherently conditional distributions like policies. Further, ACT is trained as a $\beta$-CVAE @higgins2017beta, using a weight of the KL regularization term in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> as an hyperparameter regulating the information condensed in the latent space, where higher $\beta$ results in a less expressive latent space.
+In practice, when learning from demonstrations adopting CVAEs results in a slight modification to the VAE objective in <a href="#ELBO" data-reference-type="ref" data-reference="ELBO">[ELBO]</a>, which is adapted to
+``` math
+\begin{align}
+
+    \text{ELBO}_{\mathcal D}(\theta, \phi, \omega) = \sum_{i=0}^{N} \left(
+            \mathbb{E}_{z \sim q_\phi(\cdot \vert o_i, a_i)} \big[ \log p_\theta(a_i \vert z, o_i) \big]
+        - \text{D}_{\text{KL}}\big[ q_\phi(z \vert o_i, a_i) \Vert p_\omega(z \vert o_i) \big]
+        \right)
+\end{align}
+```
+Notice how in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> we are now also learning a new set of parameters $\omega$ for the prior distribution in the latent space. Effectively, this enables conditioning latent-space sampling (and thus reconstruction) during training, and potentially inference, providing useful when learning inherently conditional distributions like policies. Further, ACT is trained as a $\beta$-CVAE @higgins2017beta, using a weight of the KL regularization term in <a href="#c-ELBO" data-reference-type="ref" data-reference="c-ELBO">[c-ELBO]</a> as an hyperparameter regulating the information condensed in the latent space, where higher $\beta$ results in a less expressive latent space.
 
 In their work, @zhaoLearningFineGrainedBimanual2023 ablated using a GM to learn from human demonstrations compared to a simpler, supervised objective, $\mathcal L_1(a,a^\prime) = \Vert a - a^\prime \Vert_1$. Interestingly, they found the performance of these two approaches to be comparable when learning from *scripted* demonstrations. That is, when learning from data collected rolling out a predetermined set of commands $[q^c_0, q^c_1, \dots]$, GM did *not* prove competitive compared to standard supervised learning. However, when learning from human demonstrations--i.e., from data collected executing commands coming from a human controller $[q^h_0, q^h_1, \dots]$--they found performance (success rate on a downstream task) to be severily (-33.3%) hindered from adopting a standard supervised learning objective compared to a richer, potentially more complex to learn variational objective, in keeping with the multimodal nature of human demonstrations data and findings presented in @florenceImplicitBehavioralCloning2022. The authors also ablate the action chunking paradigm, reporting significant performance gains for performing action chunking (1% vs. 44% success rate). To avoid acting openloop, @zhaoLearningFineGrainedBimanual2023 design an inference process consisting in performing inference at every timestep $t$ and then aggregate overlapping chunks using chunks’ exponential moving average.
 
@@ -973,7 +1067,7 @@ In their work, @zhaoLearningFineGrainedBimanual2023 ablated using a GM to learn
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-act" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-act" style="position: absolute;"></span>
 <figcaption>Action Chunking with Transformer (ACT), as in @zhaoLearningFineGrainedBimanual2023. ACT introduces an action chunking paradigm to cope with high-dimensional multi-modal demonstration data, and a transformer-based CVAE architecture.</figcaption>
 </figure>
 
@@ -987,7 +1081,7 @@ In ACT (Figure <a href="#ch4-act" data-reference-type="ref" data-reference="ch4
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-act-encoder" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-act-encoder" style="position: absolute;"></span>
 <figcaption>The CVAE encoder used in ACT. Input action chunks are first embedded and aggregated with positional embeddings, before being processed alongside embedded proprioperceptive information, and a learned <code>[CLS]</code> token used to aggregate input level information, and predict the style variable <span class="math inline"> <em>z</em> </span>. The encoder is entirely disregarded at inference time.</figcaption>
 </figure>
 
@@ -1001,7 +1095,7 @@ However, the authors claim using a deterministic procedure to derive $z$ may ben
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-act-decoder" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-act-decoder" style="position: absolute;"></span>
 <figcaption>The CVAE decoder used in ACT, comprising of a full encoder-decoder Transformer architecture. Camera observations from all <span class="math inline"> <em>n</em> </span> camera views are first embedded using pre-trained visual encoders, and then concatenated to the corresponding positional embeddings. Then, alongside embeddings for the proprioperceptive information available and the style variable <span class="math inline"> <em>z</em> </span> retrieved from the CVAE encoder, the Transformer encoder shares the matrices <span class="math inline"> <em>K</em>, <em>Q</em> </span> with the Transformer decoder, trained to decode fixed position embeddings into action valid chunks.</figcaption>
 </figure>
 
@@ -1011,13 +1105,17 @@ However, the authors claim using a deterministic procedure to derive $z$ may ben
 
 DMs proved very effective in approximating complex highly dimensional distributions, such as distributions over images @hoDenoisingDiffusionProbabilistic2020 or videos @polyakMovieGenCast2025, thanks to their inherent capability to deal with multimodal data and training stability. In Diffusion Policy (DP), @chiDiffusionPolicyVisuomotor2024 present an application of DMs the field of robot learning, leveraging diffusion to model human expert demonstrations in a variety of simulated and real-world tasks. Similarily to Action Chunking with Transformer @zhaoLearningFineGrainedBimanual2023, @chiDiffusionPolicyVisuomotor2024 (1) adopt a modified *observation-conditioned target distribution* instead of the full joint $p(o,a)$ and (2) predict multiple actions into the future instead of a single action. Besides the intractability of the observations’ marginal $p_\theta(o)$ given $p_\theta(o,a)$, DP’s rationale for modeling the data distribution via $p_\theta(a \vert o)$ stems from the rather test-time compute intensive nature of diffusion, whereby generating actions *alongside* observations is likely to result in higher complexity and thus a likely larger number of denoising operations, which would prove ultimately pointless considering robotics applications rely on the capability to generate controls rather than reproducing observations.
 
-In practice, conditioning on observation data is achieved conditioning the added noise regressor $\epsilon_\theta$ introduced in <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a> on a stack of $T_o$ observations, resulting in the *conditional* simplified diffusion objective 
-
-$$
-`\htmlId{diffusion-policy-objective}{\mathcal L(\theta) = \mathbb{E}_{t, a_{t:t+H_a}, \epsilon} \big[ \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} a_{t:t+T_a} + \epsilon \sqrt{1 - \bar \alpha_t}, t, o_{t-T_o:t}) \Vert^2 \big],\\ t \sim \mathcal{U}(\{1,\dots,T\}), \quad a_{t:t+T_a}, o_{t-T_o:t} \sim \mathcal{D}, \quad \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}). \notag}`
-$$
-
- Notice how in <a href="#diffusion-policy-objective" data-reference-type="ref" data-reference="diffusion-policy-objective">[diffusion-policy-objective]</a> the noise regressor is conditioned both on the latent variable rank $t$ *and* on a stack of previous observations $o_{t-T_o-t}$.  @chiDiffusionPolicyVisuomotor2024 claim the combination of (1) conditioning on a horizon of previous observations and (2) predicting multiple actions into the future allows DP to *commit to specific modes* in the data at inference time, which proves essential for good performance and avoiding undecisiveness.
+In practice, conditioning on observation data is achieved conditioning the added noise regressor $\epsilon_\theta$ introduced in <a href="#diffusion-simplified-loss" data-reference-type="ref" data-reference="diffusion-simplified-loss">[diffusion-simplified-loss]</a> on a stack of $T_o$ observations, resulting in the *conditional* simplified diffusion objective
+``` math
+\begin{align}
+    \mathcal L(\theta) &= \mathbb{E}_{t, a_{t:t+H_a}, \epsilon} \big[
+        \Vert \epsilon - \epsilon_\theta(\sqrt{\bar \alpha_t} a_{t:t+T_a} + \epsilon \sqrt{1 - \bar \alpha_t}, t, o_{t-T_o:t}) \Vert^2 \big],  \\
+        & t \sim \mathcal{U}(\{1,\dots,T\}), \quad
+        a_{t:t+T_a}, o_{t-T_o:t} \sim \mathcal{D}, \quad
+        \epsilon \sim \mathcal{N}(\mathbf{0},\mathbf{I}). \notag 
+\end{align}
+```
+Notice how in <a href="#diffusion-policy-objective" data-reference-type="ref" data-reference="diffusion-policy-objective">[diffusion-policy-objective]</a> the noise regressor is conditioned both on the latent variable rank $t$ *and* on a stack of previous observations $o_{t-T_o-t}$.  @chiDiffusionPolicyVisuomotor2024 claim the combination of (1) conditioning on a horizon of previous observations and (2) predicting multiple actions into the future allows DP to *commit to specific modes* in the data at inference time, which proves essential for good performance and avoiding undecisiveness.
 
 <figure>
 <ResponsiveImage
@@ -1027,7 +1125,7 @@ $$
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="diffusion-policy-architecture" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="diffusion-policy-architecture" style="position: absolute;"></span>
 <figcaption>The Diffusion Policy archicture, as in @chiDiffusionPolicyVisuomotor2024. A stack of <span class="math inline"> <em>H</em> <sub> <em>o</em> </sub> </span> previous observations is used as external conditioning to denoise a group of <span class="math inline"> <em>H</em> <sub> <em>a</em> </sub> </span> actions. Conditioning is used at every layer of a U-Net block, and in practice allows to obtain fully-formed action chunks with as little as <span class="math inline"> <em>T</em> = 10</span> denoising steps.</figcaption>
 </figure>
 
@@ -1058,7 +1156,7 @@ We directly assess the lack of adaptiveness of robot systems due to acting open-
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-async-inference" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-async-inference" style="position: absolute;"></span>
 </div>
 <figcaption><strong>Asynchronous inference</strong>. Illustration of the asynchronous inference stack. Note that the policy can be run on a remote server, possibly with GPUs.</figcaption>
 </figure>
@@ -1101,7 +1199,7 @@ Interestingly, the behavior of async inference can be studied analytically. Firs
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch4-queues" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch4-queues" style="position: absolute;"></span>
 </div>
 <figcaption>Action queue size evolution at runtime for various levels of <span class="math inline"> <em>g</em> </span> when (A) not filtering out observation based on joint-space similarity and (B) filtering out near-duplicates observation, measuring their similarity in joint-space.</figcaption>
 </figure>
@@ -1135,7 +1233,7 @@ The advent of large models trained on internet-scale datasets has drastically in
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-ml-vs-robotics-foundation" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-ml-vs-robotics-foundation" style="position: absolute;"></span>
 <figcaption>Fields within ML such as Computer Vision and NLP converged on the development of foundation models, trained on a variety of large scale models and capable to perform multiple downstream tasks (top). Conversely, robotics suffered from limited standardization in terms of the architectures used, and siloed, task specific datasets, incurring in a high degree of fragmentation which traditionally hindered the development of generalist models for robotics in favour of task-specific models (bottom).</figcaption>
 </figure>
 
@@ -1151,7 +1249,7 @@ The remarkable success of foundation models in NLP and CV is predicated on two c
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-generalist-policies-timeline" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-generalist-policies-timeline" style="position: absolute;"></span>
 <figcaption>Early efforts in the development of generalist models for robotics include BC-Zero @jangBCZZeroShotTask2022, RT-1 @brohanRT1RoboticsTransformer2023, and RT-2 @brohanRT2VisionLanguageActionModels2023: large scale models trained on thousands of demonstrations. The open release of the Open-X @collaborationOpenXEmbodimentRobotic2025 and DROID datasets @khazatskyDROIDLargeScaleInTheWild2025 fostered the development of open source models: OpenVLA @kimOpenVLAOpenSourceVisionLanguageAction2024, <span class="math inline"> <em>π</em> <sub>0</sub> </span> @blackp0VisionLanguageActionFlow2024 and SmolVLA @shukorSmolVLAVisionLanguageActionModel2025.</figcaption>
 </figure>
 
@@ -1171,7 +1269,7 @@ The success of large, proprietary models like RT-1 and RT-2, highlighted a growi
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-trends" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-trends" style="position: absolute;"></span>
 <figcaption>Robot learning is undergoing a paradigmatic shift: centralized data collections (A, left) are increasingly larger, often comprising Ms of demonstrations, and (A, right) decentralized approaches to data collection are also rising as an alternative for large scale data collection. (B) Generalist models are also becoming increasingly smaller and easier to run on limited hardware.</figcaption>
 </figure>
 
@@ -1201,19 +1299,30 @@ $\pi_0$ @blackp0VisionLanguageActionFlow2024 introduce a VLA consisting of a Mo
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-pi0" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-pi0" style="position: absolute;"></span>
 <figcaption>The <span class="math inline"> <em>π</em> <sub>0</sub> </span>architecture, as in @blackp0VisionLanguageActionFlow2024. Vision and language tokens are routed to a VLM backbone which is prevented from attending robot proprioperceptive states and action tokens, which are instead routed to a smaller subset of weights within the architecture. The architecture is trained with Flow Matching on 10M+ trajectories from a mixture of closed and openly available datasets.</figcaption>
 </figure>
 
 Concretely, $\pi_0$ is a unified transformer with two disjoint sets of weights $\phi, \theta$. A larger VLM backbone $p_\phi$ initialized from Gemma 2.6B processes multiple image frames obtained from multiple cameras points $[\{ I_t \}_{t=1}^n]$, as well as a language instruction $[\ell_t]$ used to describe the task considered. Concurrently, a 300M-parameter *action expert* based on a similar transformer architecture is used processes the robot proprioperceptive state $q_t$ and an action chunk $a_{t:t+H_a}$ (Figure <a href="#ch5-pi0" data-reference-type="ref" data-reference="ch5-pi0">[ch5-pi0]</a>). The different expert networks operate separately in processing the respective inputs and turning them into query, key and value matrices, and only share information between each other via self-attention layers. The outputs from the VLM backbone are disregarded, while the vector field regressed by the action expert is used to iteratively refine the action process. In particular, $\pi_0$uses a *blockwise causal attention mask* over tokens belonging to three separate blocks: (1) image and language tokens $\mathcal T_i$ obtained from $[\{ I_t \}_{t=1}^n, \ell_t]$, (2) proprioperceptive tokens $\mathcal T_q$ obtained from $q_t$, and (3) the action tokens $\mathcal T_a$ for items in the chunk $a^{\tau}_{t:t+H_a}$ at time $\tau$ in the flow-matching process. Notably, *within* each block the attention operations are bidirectional, while across blocks, future blocks are masked out. Formally, this corresponds to using the attention mask $\mathbf{A} = \bordermatrix{ \mathcal{T}_i \mathcal{T}_q \mathcal{T}_a \cr \mathcal{T}_i \mathbf{1} \mathbf{0} \mathbf{0} \cr \mathcal{T}_q \mathbf{1} \mathbf{1} \mathbf{0} \cr \mathcal{T}_a \mathbf{1} \mathbf{1} \mathbf{1} \cr }, \quad \mathbf{1}: \text{Bidirectional Attention}, \ \mathbf{0}: \text{Masked Attention}$ Note how *intra*-block directional attention allows tokens to communicate freely, while *inter*-block communication is mediated by the attention mask $\mathbf{A}$. *Blockwise causal masking* effectively prevents the pre-trained perception-language tokens from attending to robotics-tokens, likely out of distribution for VLM backbones traditionally trained on large corpora of internet, non-robotics, data. Crucially, because communication is obstructed between image-language tokens, proprioperceptive and action tokens, one can cache keys and values across denoising steps at runtime time, incuring in a reduced computational footprint and faster inference.
 
-In $\pi_0$, both the VLM backbone and action expert are update using a *flow matching* loss, and in particular are updated minimizing: 
+In $\pi_0$, both the VLM backbone and action expert are update using a *flow matching* loss, and in particular are updated minimizing:
+``` math
+\begin{align}
+    \mathcal{L}(\phi, \theta) &= 
+    \mathbb{E}_{\tau, \epsilon, o_t, a_{t:t+H_a}}\Big[
+        \big\Vert 
+            v_\theta(\underbrace{\tau a_{t:t+H_a} + (1-\tau) \epsilon}_{\tilde a_{t:t+H_a}},\, o_t,\, \tau)
+            - (\epsilon - a_{t:t+H_a})
+        \big\Vert^2
+    \Big],  \\
+    &\tau \sim \mathrm{Beta}_{[0,s]}(1.5,1), \quad
+    \epsilon \sim \mathcal{N}(\mathbf{0}, \mathbf{I}), \quad
+    o_t, a_{t:t+H_a} \sim \mathcal D \notag
+\end{align}
+```
 
-$$
-`\htmlId{pi0-loss}{\mathcal{L}(\phi, \theta) = \mathbb{E}_{\tau, \epsilon, o_t, a_{t:t+H_a}}\Big[ \big\Vert v_\theta(\underbrace{\tau a_{t:t+H_a} + (1-\tau) \epsilon}_{\tilde a_{t:t+H_a}},\, o_t,\, \tau) - (\epsilon - a_{t:t+H_a}) \big\Vert^2 \Big],\\ \tau \sim \mathrm{Beta}_{[0,s]}(1.5,1), \quad \epsilon \sim \mathcal{N}(\mathbf{0}, \mathbf{I}), \quad o_t, a_{t:t+H_a} \sim \mathcal D \notag}`
-$$
+Where the experts parametrized by the separate weights $\phi, \theta$ interact with each other via self-attention layers only, so that the action expert $v_\theta$ internal computations also depend on the VLM backbone’s parameters $\phi$. Importantly, @blackp0VisionLanguageActionFlow2024 minimize <a href="#pi0-loss" data-reference-type="ref" data-reference="pi0-loss">[pi0-loss]</a> over both the multimodal backbone and action expert parameters, thus updating the internal representations of the VLM using BC-specific gradients. In contrast, @driessKnowledgeInsulatingVisionLanguageAction2025 later show that failing to insulate the VLM knowledge from the flow matching gradients actually harms performance. Inference is performed iteratively refining action chunks while numerically forward-integrating the vector field predicted by the action expert,
 
- Where the experts parametrized by the separate weights $\phi, \theta$ interact with each other via self-attention layers only, so that the action expert $v_\theta$ internal computations also depend on the VLM backbone’s parameters $\phi$. Importantly, @blackp0VisionLanguageActionFlow2024 minimize <a href="#pi0-loss" data-reference-type="ref" data-reference="pi0-loss">[pi0-loss]</a> over both the multimodal backbone and action expert parameters, thus updating the internal representations of the VLM using BC-specific gradients. In contrast, @driessKnowledgeInsulatingVisionLanguageAction2025 later show that failing to insulate the VLM knowledge from the flow matching gradients actually harms performance. Inference is performed iteratively refining action chunks while numerically forward-integrating the vector field predicted by the action expert,
 ``` math
 \begin{equation}
     a_{t:t+H_a}^{\tau + \delta} = a_{t:t+H_a}^{\tau } + \delta v_\theta(a_{t:t+H_a}^{\tau }, o_t)
@@ -1255,7 +1364,7 @@ VLAs remain in an early stage of development and are not yet as mature or widely
   layout="fixed"
   alt="Figure"
 />
-<p>&lt;span id="ch5-smolvla" style="position: absolute;"&gt;&lt;/span&gt;</p>
+<span id="ch5-smolvla" style="position: absolute;"></span>
 <figcaption>The SmolVLA architecture, as in @shukorSmolVLAVisionLanguageActionModel2025. SmolVLA is a compact MoE model trained with flow matching to denoise action chunks. Vision and language tokens are fed to a VLM backbone, and share information with the proprioperceptive and action tokens via the attention mechanism. The attention expert interleaves SA and CA layers for further conditioning on the visual features from the VLM backbone. SmolVLA skips computations and reduces the visual tokens, resulting in 6x less memory usage than <span class="math inline"> <em>π</em> <sub>0</sub> </span>.</figcaption>
 </figure>
 
diff --git a/app/src/content/embeds/banner.html b/app/src/content/embeds/banner.html
new file mode 100644
index 0000000000000000000000000000000000000000..1ad415ed788791dcb7eec078aea3fda6d4d8907c
--- /dev/null
+++ b/app/src/content/embeds/banner.html
@@ -0,0 +1,267 @@
+<div class="d3-galaxy" style="width:100%;margin:10px 0;aspect-ratio:3/1;min-height:260px;"></div>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) {
+        s = document.createElement('script');
+        s.id = 'd3-cdn-script';
+        s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js';
+        document.head.appendChild(s);
+      }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const mount = document.currentScript ? document.currentScript.previousElementSibling : null;
+      const container = (mount && mount.querySelector && mount.querySelector('.d3-galaxy')) || document.querySelector('.d3-galaxy');
+      if (!container) return;
+      if (container.dataset) {
+        if (container.dataset.mounted === 'true') return;
+        container.dataset.mounted = 'true';
+      }
+      // Scene params (match previous Plotly ranges)
+      const cx = 1.5, cy = 0.5;
+      const a = 1.3, b = 0.45;
+      const numPoints = 3000; 
+      const numArms = 3;
+      const numTurns = 2.1;
+      const angleJitter = 0.12;
+      const posNoise = 0.015;
+
+      // Generate spiral + bulge
+      const twoPi = Math.PI * 2;
+      const t = Float64Array.from({ length: numPoints }, () => Math.random() * (twoPi * numTurns));
+      const armIndices = Int16Array.from({ length: numPoints }, () => Math.floor(Math.random() * numArms));
+      const armOffsets = Float64Array.from(armIndices, (k) => k * (twoPi / numArms));
+      const theta = Float64Array.from(t, (tv, i) => tv + armOffsets[i] + d3.randomNormal.source(Math.random)(0, angleJitter)());
+      const rNorm = Float64Array.from(t, (tv) => Math.pow(tv / (twoPi * numTurns), 0.9));
+      const noiseScale = (rn) => posNoise * (0.8 + 0.6 * rn);
+      const noiseX = Float64Array.from(rNorm, (rn) => d3.randomNormal.source(Math.random)(0, noiseScale(rn))());
+      const noiseY = Float64Array.from(rNorm, (rn) => d3.randomNormal.source(Math.random)(0, noiseScale(rn))());
+
+      const xSpiral = Float64Array.from(theta, (th, i) => cx + a * rNorm[i] * Math.cos(th) + noiseX[i]);
+      const ySpiral = Float64Array.from(theta, (th, i) => cy + b * rNorm[i] * Math.sin(th) + noiseY[i]);
+
+      const bulgePoints = Math.floor(0.18 * numPoints);
+      const phiB = Float64Array.from({ length: bulgePoints }, () => twoPi * Math.random());
+      const rB = Float64Array.from({ length: bulgePoints }, () => Math.pow(Math.random(), 2.2) * 0.22);
+      const noiseXB = Float64Array.from({ length: bulgePoints }, () => d3.randomNormal.source(Math.random)(0, posNoise * 0.6)());
+      const noiseYB = Float64Array.from({ length: bulgePoints }, () => d3.randomNormal.source(Math.random)(0, posNoise * 0.6)());
+      const xBulge = Float64Array.from(phiB, (ph, i) => cx + a * rB[i] * Math.cos(ph) + noiseXB[i]);
+      const yBulge = Float64Array.from(phiB, (ph, i) => cy + b * rB[i] * Math.sin(ph) + noiseYB[i]);
+
+      // Concatenate
+      const X = Array.from(xSpiral).concat(Array.from(xBulge));
+      const Y = Array.from(ySpiral).concat(Array.from(yBulge));
+      const lenSpiral = xSpiral.length;
+
+      const zSpiral = Array.from(rNorm, (rn) => 1 - rn);
+      const maxRB = rB && rB.length ? (window.d3 && d3.max ? d3.max(rB) : Math.max.apply(null, Array.from(rB))) : 1;
+      const zBulge = Array.from(rB, (rb) => 1 - (maxRB ? rb / maxRB : 0));
+      const Zraw = zSpiral.concat(zBulge);
+      const sizesPx = Zraw.map((z) => (z + 1) * 5); // 5..10 px (diameter)
+
+      // Labels (same categories as Python version)
+      const labelOf = (i) => {
+        const z = Zraw[i];
+        if (z < 0.25) return 'smol dot';
+        if (z < 0.5) return 'ok-ish dot';
+        if (z < 0.75) return 'a dot';
+        return 'biiig dot';
+      };
+
+      // Sort by size ascending for z-index: small first, big last
+      const idx = d3.range(X.length).sort((i, j) => sizesPx[i] - sizesPx[j]);
+
+      // Colors: piecewise gradient [0 -> 0.5 -> 1]
+      const c0 = d3.rgb(78, 165, 183);    // rgb(78, 165, 183)
+      const c1 = d3.rgb(206, 192, 250);   // rgb(206, 192, 250)
+      const c2 = d3.rgb(232, 137, 171);   // rgb(232, 137, 171)
+      const interp01 = d3.interpolateRgb(c0, c1);
+      const interp12 = d3.interpolateRgb(c1, c2);
+      const colorFor = (v) => {
+        const t = Math.max(0, Math.min(1, v));
+        return t <= 0.5 ? interp01(t / 0.5) : interp12((t - 0.5) / 0.5);
+      };
+
+      // Create SVG
+      const svg = d3.select(container).append('svg')
+        .attr('width', '100%')
+        .style('display', 'block')
+        .style('cursor', 'crosshair');
+
+      const render = () => {
+        const width = container.clientWidth || 800;
+        const height = Math.max(260, Math.round(width / 3)); // keep ~3:1, min height
+        svg.attr('width', width).attr('height', height);
+
+        const xScale = d3.scaleLinear().domain([0, 3]).range([0, width]);
+        const yScale = d3.scaleLinear().domain([0, 1]).range([height, 0]);
+
+        // Subtle stroke color depending on theme
+        const isDark = document.documentElement.getAttribute('data-theme') === 'dark';
+        const strokeColor = isDark ? 'rgba(255,255,255,0.18)' : 'rgba(0,0,0,0.12)';
+        const glowColor = isDark ? 'rgba(255,255,255,0.35)' : 'rgba(0,0,0,0.25)';
+
+
+        // Group for points (no blend mode for better print/PDF visibility)
+        const g = svg.selectAll('g.points').data([0]).join('g').attr('class', 'points');
+
+        // Ensure container can host an absolute tooltip
+        container.style.position = container.style.position || 'relative';
+        let tip = container.querySelector('.d3-tooltip');
+        let tipInner;
+        if (!tip) {
+          tip = document.createElement('div');
+          tip.className = 'd3-tooltip';
+          Object.assign(tip.style, {
+            position: 'absolute',
+            top: '0px',
+            left: '0px',
+            transform: 'translate(-9999px, -9999px)',
+            pointerEvents: 'none',
+            padding: '10px 12px',
+            borderRadius: '12px',
+            fontSize: '12px',
+            lineHeight: '1.35',
+            border: '1px solid var(--border-color)',
+            background: 'var(--surface-bg)',
+            color: 'var(--text-color)',
+            boxShadow: '0 8px 32px rgba(0,0,0,.28), 0 2px 8px rgba(0,0,0,.12)',
+            opacity: '0',
+            transition: 'opacity .12s ease',
+            backdropFilter: 'saturate(1.12) blur(8px)',
+            zIndex: '20'
+          });
+          tipInner = document.createElement('div');
+          tipInner.className = 'd3-tooltip__inner';
+          Object.assign(tipInner.style, {
+            textAlign: 'left',
+            display: 'flex',
+            flexDirection: 'column',
+            gap: '6px',
+            minWidth: '220px'
+          });
+          tip.appendChild(tipInner);
+          container.appendChild(tip);
+        } else {
+          tipInner = tip.querySelector('.d3-tooltip__inner') || tip;
+        }
+
+        // Final filter: remove small dots very close to the galaxy center (after placement)
+        const centerHoleRadius = 0.48; // elliptical radius threshold
+        const smallSizeThreshold = 7.5; // same notion as Python size cut
+        const rTotal = idx.map((i) => Math.sqrt(((X[i] - cx) / a) ** 2 + ((Y[i] - cy) / b) ** 2));
+        const idxFiltered = idx.filter((i, k) => !(rTotal[k] <= centerHoleRadius && sizesPx[i] < smallSizeThreshold));
+
+        const sel = g.selectAll('circle').data(idxFiltered, (i) => i);
+        sel.join(
+          (enter) => enter.append('circle')
+            .attr('cx', (i) => xScale(X[i]))
+            .attr('cy', (i) => yScale(Y[i]))
+            .attr('r', (i) => sizesPx[i] / 2)
+            .attr('fill', (i) => colorFor(Zraw[i]))
+            .attr('fill-opacity', 0.9)
+            .attr('stroke', strokeColor)
+            .attr('stroke-width', 0.4)
+            .on('mouseenter', function(ev, i) {
+              d3.select(this).raise()
+                .style('filter', `drop-shadow(0 0 8px ${glowColor})`)
+                .transition().duration(120).ease(d3.easeCubicOut)
+                .attr('stroke', isDark ? 'rgba(255,255,255,0.85)' : 'rgba(0,0,0,0.85)')
+                .attr('stroke-width', 1.4)
+                .attr('r', (sizesPx[i] / 2) * 1.25)
+                .attr('fill-opacity', 1);
+              const r = Math.sqrt(((X[i] - cx) / a) ** 2 + ((Y[i] - cy) / b) ** 2);
+              const type = i < lenSpiral ? 'spiral' : 'bulge';
+              const arm = i < lenSpiral ? (armIndices[i] + 1) : null;
+              tipInner.innerHTML =
+                `<div style="font-weight:800;letter-spacing:.1px;"><strong>${labelOf(i)}</strong></div>` +
+                `<div style="font-size:11px;color:var(--muted-color);margin-top:-4px;margin-bottom:2px;letter-spacing:.1px;"><strong>Type</strong> ${type}${arm ? ` (Arm ${arm})` : ''}</div>` +
+                `<div style="padding-top:6px;border-top:1px solid var(--border-color);"><strong>Position</strong> X ${X[i].toFixed(2)} · <strong>Y</strong> ${Y[i].toFixed(2)}</div>` +
+                `<div><strong>Distance</strong> Radius ${r.toFixed(3)} · <strong>Z</strong> ${Zraw[i].toFixed(3)}</div>` +
+                `<div><strong>Size</strong> ${sizesPx[i].toFixed(1)} px</div>`;
+              tip.style.opacity = '1';
+            })
+            .on('mousemove', (ev, i) => {
+              const [mx, my] = d3.pointer(ev, container);
+              const offsetX = 10, offsetY = 12;
+              tip.style.transform = `translate(${Math.round(mx + offsetX)}px, ${Math.round(my + offsetY)}px)`;
+            })
+            .on('mouseleave', function() {
+              tip.style.opacity = '0';
+              tip.style.transform = 'translate(-9999px, -9999px)';
+              d3.select(this)
+                .style('filter', null)
+                .transition().duration(120).ease(d3.easeCubicOut)
+                .attr('stroke', strokeColor)
+                .attr('stroke-width', 0.4)
+                .attr('r', (i2) => sizesPx[i2] / 2)
+                .attr('fill-opacity', 0.9);
+            }),
+          (update) => update
+            .attr('cx', (i) => xScale(X[i]))
+            .attr('cy', (i) => yScale(Y[i]))
+            .attr('r', (i) => sizesPx[i] / 2)
+            .attr('fill', (i) => colorFor(Zraw[i]))
+            .attr('fill-opacity', 0.9)
+            .attr('stroke', strokeColor)
+            .attr('stroke-width', 0.4)
+            .on('mouseenter', function(ev, i) {
+              d3.select(this).raise()
+                .style('filter', `drop-shadow(0 0 8px ${glowColor})`)
+                .transition().duration(120).ease(d3.easeCubicOut)
+                .attr('stroke', isDark ? 'rgba(255,255,255,0.85)' : 'rgba(0,0,0,0.85)')
+                .attr('stroke-width', 1.4)
+                .attr('r', (sizesPx[i] / 2) * 1.25)
+                .attr('fill-opacity', 1);
+              const r = Math.sqrt(((X[i] - cx) / a) ** 2 + ((Y[i] - cy) / b) ** 2);
+              const type = i < lenSpiral ? 'spiral' : 'bulge';
+              const arm = i < lenSpiral ? (armIndices[i] + 1) : null;
+              tipInner.innerHTML =
+                `<div style="font-weight:800;letter-spacing:.1px;"><strong>${labelOf(i)}</strong></div>` +
+                `<div style="font-size:11px;color:var(--muted-color);margin-top:-4px;margin-bottom:2px;letter-spacing:.1px;"><strong>Type</strong> ${type}${arm ? ` (Arm ${arm})` : ''}</div>` +
+                `<div style="padding-top:6px;border-top:1px solid var(--border-color);"><strong>Position</strong> X ${X[i].toFixed(2)} · <strong>Y</strong> ${Y[i].toFixed(2)}</div>` +
+                `<div><strong>Distance</strong> Radius ${r.toFixed(3)} · <strong>Z</strong> ${Zraw[i].toFixed(3)}</div>` +
+                `<div><strong>Size</strong> ${sizesPx[i].toFixed(1)} px</div>`;
+              tip.style.opacity = '1';
+            })
+            .on('mousemove', (ev, i) => {
+              const [mx, my] = d3.pointer(ev, container);
+              const offsetX = 10, offsetY = 12;
+              tip.style.transform = `translate(${Math.round(mx + offsetX)}px, ${Math.round(my + offsetY)}px)`;
+            })
+            .on('mouseleave', function() {
+              tip.style.opacity = '0';
+              tip.style.transform = 'translate(-9999px, -9999px)';
+              d3.select(this)
+                .style('filter', null)
+                .transition().duration(120).ease(d3.easeCubicOut)
+                .attr('stroke', strokeColor)
+                .attr('stroke-width', 0.4)
+                .attr('r', (i2) => sizesPx[i2] / 2)
+                .attr('fill-opacity', 0.9);
+            })
+        );
+      };
+
+      // First render + resize
+      if (window.ResizeObserver) {
+        const ro = new ResizeObserver(() => render());
+        ro.observe(container);
+      } else {
+        window.addEventListener('resize', render);
+      }
+      render();
+    };
+
+    if (document.readyState === 'loading') {
+      document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true });
+    } else { ensureD3(bootstrap); }
+  })();
+</script>
+
diff --git a/app/src/content/embeds/d3-bar.html b/app/src/content/embeds/d3-bar.html
new file mode 100644
index 0000000000000000000000000000000000000000..15a6766e601399392e2192b14c7f21f751e76d35
--- /dev/null
+++ b/app/src/content/embeds/d3-bar.html
@@ -0,0 +1,317 @@
+<div class="d3-bar"  ></div>
+<style>
+  .d3-bar .controls { margin-top: 0; display: flex; gap: 16px; align-items: center; justify-content: flex-end; flex-wrap: wrap; }
+  .d3-bar .controls .control-group { display: flex; flex-direction: column; align-items: flex-start; gap: 6px; }
+  .d3-bar .controls label { font-size: 12px; color: var(--text-color); font-weight: 700; }
+  .d3-bar .controls select { font-size: 12px; padding: 8px 28px 8px 10px; border: 1px solid var(--border-color); border-radius: 8px; background-color: var(--surface-bg); color: var(--text-color); background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%230f1115' stroke-width='2' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E"); background-repeat: no-repeat; background-position: right 8px center; background-size: 12px; -webkit-appearance: none; -moz-appearance: none; appearance: none; cursor: pointer; transition: border-color .15s ease, box-shadow .15s ease; }
+  [data-theme="dark"] .d3-bar .controls select { background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%23ffffff' stroke-width='2' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E"); }
+  .d3-bar .controls select:hover { border-color: var(--primary-color); }
+  .d3-bar .controls select:focus { border-color: var(--primary-color); box-shadow: 0 0 0 3px rgba(232,137,171,.25); outline: none; }
+  /* Header (legend + controls) placed after chart */
+  .d3-bar .chart-header { display: flex; align-items: flex-start; justify-content: flex-start; gap: 12px; margin: 8px 0 0 0; flex-wrap: wrap; }
+  .d3-bar .legend-bottom { display: flex; flex-direction: column; align-items: flex-start; gap: 6px; font-size: 12px; color: var(--text-color); }
+  .d3-bar .legend-bottom .legend-title { font-size: 12px; font-weight: 700; color: var(--text-color); }
+  .d3-bar .legend-bottom .items { display: flex; flex-wrap: wrap; gap: 8px 14px; }
+  .d3-bar .legend-bottom .item { display: inline-flex; align-items: center; gap: 6px; white-space: nowrap; }
+  .d3-bar .legend-bottom .swatch { width: 14px; height: 14px; border-radius: 3px; border: 1px solid var(--border-color); display: inline-block; }
+  .d3-bar.hovering .legend-bottom .item.ghost { opacity: .35; }
+  .d3-bar.hovering .bars path.ghost { opacity: .35; }
+  .d3-bar .axis-label { fill: var(--text-color); font-size: 12px; font-weight: 700; }
+  /* Apply axis/tick/grid purely via CSS */
+  .d3-bar .axes path,
+  .d3-bar .axes line { stroke: var(--axis-color); }
+  .d3-bar .axes text { fill: var(--tick-color); }
+  .d3-bar .grid line { stroke: var(--grid-color); }
+  /* Tooltip improvements */
+  .d3-bar .d3-tooltip { z-index: var(--z-tooltip); backdrop-filter: saturate(1.12) blur(8px); }
+  /* Hover/transition styling for bars and legend */
+  .d3-bar .bars path.bar { transition: opacity .12s ease, stroke .12s ease, stroke-width .12s ease; }
+  .d3-bar .bars path.bar.highlight { stroke: none; stroke-width: 0; }
+  .d3-bar.hovering .bars path.ghost { opacity: .25; }
+  .d3-bar .legend-bottom .item.hovered { color: inherit; }
+  .d3-bar .legend-bottom .item.hovered .swatch { border-color: var(--border-color); }
+  .d3-bar .d3-tooltip .swatch { width: 12px; height: 12px; border-radius: 3px; border: 1px solid var(--border-color); display: inline-block; margin-right: 6px; vertical-align: -2px; }
+  /* Chart card wrapper */
+  .d3-bar .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+  /* Layout adjustments to give controls more space */
+  .d3-bar .chart-header {
+    padding-left: 8px;
+    padding-right: 8px;
+    gap: 20px;
+  }
+  .d3-bar .controls {
+    justify-content: flex-start;
+    min-width: 320px;
+  }
+  .d3-bar .controls .control-group {
+    min-width: 150px;
+  }
+  .d3-bar .controls select {
+    font-size: 13px;
+    min-width: 160px;
+  }
+</style>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const mount = document.currentScript ? document.currentScript.previousElementSibling : null;
+      const container = (mount && mount.querySelector && mount.querySelector('.d3-bar')) || document.querySelector('.d3-bar');
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted === 'true') return; container.dataset.mounted = 'true'; }
+
+      // Data, matching bar.py
+      const seqLabels = ["1024","2048","4096","8192"];
+      const seqScale = [1,2,4,8];
+      const componentKeys = ['parameters','gradients','optimizer','activations'];
+      const modelSizes = ["1B","3B","8B","70B","405B"];
+      const paramsMem = { "1B":4.0, "3B":13.3, "8B":26.0, "70B":244.0, "405B":1520.0 };
+      const actCoeff = { "1B":3.6, "3B":9.3, "8B":46.2, "70B":145.7, "405B":1519.9 };
+      const recomputeModes = ["none","selective","full"];
+
+      const activationsCurve = (sizeKey, mode) => {
+        const coeff = actCoeff[sizeKey];
+        let arr = seqScale.map((v) => coeff * (v * v));
+        if (mode === 'selective') arr = arr.map((v) => v * 0.25);
+        else if (mode === 'full') arr = arr.map((v) => v * (1 / 16));
+        return arr;
+      };
+      const stackFor = (sizeKey, mode) => {
+        const p = seqScale.map(() => paramsMem[sizeKey]);
+        const g = seqScale.map(() => paramsMem[sizeKey]);
+        const o = seqScale.map(() => 2*paramsMem[sizeKey]);
+        const a = activationsCurve(sizeKey, mode);
+        return { parameters: p, gradients: g, optimizer: o, activations: a };
+      };
+
+      const Y = {}; // Y[mode][size][component] => array
+      recomputeModes.forEach((m) => {
+        Y[m] = {}; modelSizes.forEach((s) => { Y[m][s] = stackFor(s, m); });
+      });
+
+      // Controls
+      const controls = document.createElement('div');
+      controls.className = 'controls';
+      const groupSize = document.createElement('div'); groupSize.className = 'control-group';
+      const labelSize = document.createElement('label'); labelSize.textContent = 'Model Size';
+      const selSize = document.createElement('select'); modelSizes.forEach((s) => { const o = document.createElement('option'); o.value = s; o.textContent = s; selSize.appendChild(o); });
+      groupSize.appendChild(labelSize); groupSize.appendChild(selSize);
+      const groupRecomp = document.createElement('div'); groupRecomp.className = 'control-group';
+      const labelRecomp = document.createElement('label'); labelRecomp.textContent = 'Recomputation';
+      const selRecomp = document.createElement('select'); recomputeModes.forEach((m) => { const o = document.createElement('option'); o.value = m; o.textContent = m; selRecomp.appendChild(o); });
+      groupRecomp.appendChild(labelRecomp); groupRecomp.appendChild(selRecomp);
+
+      // Header (legend + controls) to be placed after chart
+      const header = document.createElement('div'); header.className = 'chart-header';
+      const legendBottom = document.createElement('div'); legendBottom.className = 'legend-bottom';
+      const legendTitle = document.createElement('div'); legendTitle.className = 'legend-title'; legendTitle.textContent = 'Legend';
+      const legendItems = document.createElement('div'); legendItems.className = 'items';
+      legendBottom.appendChild(legendTitle); legendBottom.appendChild(legendItems);
+      header.appendChild(legendBottom);
+      header.appendChild(controls);
+      // SVG scaffolding inside a card wrapper
+      const card = document.createElement('div'); card.className = 'chart-card'; container.appendChild(card);
+      // Place header after the chart card
+      container.appendChild(header);
+      const svg = d3.select(card).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+      const gGrid = gRoot.append('g').attr('class','grid');
+      const gAxes = gRoot.append('g').attr('class','axes');
+      const gBars = gRoot.append('g').attr('class','bars');
+
+      // Tooltip
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) { tip = document.createElement('div'); tip.className = 'd3-tooltip'; Object.assign(tip.style,{ position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none', padding:'8px 10px', borderRadius:'8px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)', background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 4px 24px rgba(0,0,0,.18)', opacity:'0', transition:'opacity .12s ease' }); tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip); } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // State
+      let currentSize = modelSizes[0];
+      let currentMode = 'selective';
+      selRecomp.value = currentMode;
+
+      // Layout & scales
+      let width=800, height=360; const margin = { top: 16, right: 28, bottom: 56, left: 64 };
+      const x0 = d3.scaleBand().paddingInner(0.25).paddingOuter(0.1); // groups (seq)
+      const y = d3.scaleLinear();
+      function getCategoricalColors(count){
+        try {
+          if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+            return window.ColorPalettes.getColors('categorical', count);
+          }
+        } catch(_) {}
+        const primary = getComputedStyle(document.documentElement).getPropertyValue('--primary-color').trim() || '#E889AB';
+        const tableau = (window.d3 && window.d3.schemeTableau10) ? window.d3.schemeTableau10 : ['#4e79a7','#f28e2b','#e15759','#76b7b2','#59a14f','#edc948','#b07aa1','#ff9da7','#9c755f','#bab0ab'];
+        const pool = [primary, ...tableau];
+        const arr = []; for (let i=0;i<count;i++){ arr.push(pool[i % pool.length]); }
+        return arr;
+      }
+      const palette = getCategoricalColors(componentKeys.length);
+      const colorMap = new Map(componentKeys.map((k,i)=>[k, palette[i]]));
+      const colorOf = (key) => colorMap.get(key) || 'var(--primary-color)';
+
+      function yMax(sizeKey, mode){
+        const s = Y[mode][sizeKey];
+        let max = 0; for (let i=0;i<seqLabels.length;i++){ const sum = s.parameters[i]+s.gradients[i]+s.optimizer[i]+s.activations[i]; if (sum>max) max=sum; }
+        return max*1.05;
+      }
+
+      function renderLegend(){
+        legendItems.innerHTML = componentKeys.map((key, i) => {
+          const color = palette[i];
+          return `<span class="item" data-key="${key}"><span class=\"swatch\" style=\"background:${color}\"></span><span>${key}</span></span>`;
+        }).join('');
+        legendItems.querySelectorAll('.item').forEach((el) => {
+          el.addEventListener('mouseenter', () => {
+            const k = el.getAttribute('data-key'); if (!k) return;
+            container.classList.add('hovering');
+            gBars.selectAll('path.bar').classed('ghost', d => d && d.key !== k);
+            legendItems.querySelectorAll('.item').forEach(it => it.classList.toggle('ghost', it.getAttribute('data-key') !== k));
+          });
+          el.addEventListener('mouseleave', () => {
+            container.classList.remove('hovering');
+            gBars.selectAll('path.bar').classed('ghost', false);
+            legendItems.querySelectorAll('.item').forEach(it => it.classList.remove('ghost'));
+          });
+        });
+      }
+
+      function updateScales(){
+        width = container.clientWidth || 800; height = Math.max(260, Math.round(width/3)); svg.attr('width', width).attr('height', height);
+        const innerWidth = width - margin.left - margin.right; const innerHeight = height - margin.top - margin.bottom; gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+
+        x0.domain(seqLabels).range([0, innerWidth]);
+        y.domain([0, yMax(currentSize, currentMode)]).range([innerHeight, 0]).nice();
+
+        // Grid
+        gGrid.selectAll('*').remove();
+        gGrid.selectAll('line').data(y.ticks(6)).join('line')
+          .attr('x1', 0).attr('x2', innerWidth).attr('y1', (d)=>y(d)).attr('y2', (d)=>y(d))
+          .attr('stroke', 'var(--grid-color)').attr('stroke-width', 1).attr('shape-rendering', 'crispEdges');
+
+        // Axes
+        gAxes.selectAll('*').remove();
+        gAxes.append('g').attr('transform', `translate(0,${innerHeight})`).call(d3.axisBottom(x0)).call((g)=>{ g.selectAll('path, line').attr('stroke', 'var(--axis-color)'); g.selectAll('text').attr('fill', 'var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('g').call(d3.axisLeft(y).ticks(6).tickFormat(d3.format('~f'))).call((g)=>{ g.selectAll('path, line').attr('stroke', 'var(--axis-color)'); g.selectAll('text').attr('fill', 'var(--tick-color)').style('font-size','12px'); });
+
+        // Axis labels
+        gAxes.append('text').attr('class','axis-label axis-label--x').attr('x', innerWidth/2).attr('y', innerHeight + 44).attr('text-anchor','middle').text('Sequence Length');
+        gAxes.append('text').attr('class','axis-label axis-label--y').attr('text-anchor','middle').attr('transform', `translate(${-52},${innerHeight/2}) rotate(-90)`).text('Memory (GB)');
+
+        renderLegend();
+
+        return { innerWidth, innerHeight };
+      }
+
+      function drawBars(){
+        const stacks = Y[currentMode][currentSize];
+        const series = componentKeys.map((key, i)=>({ key, color: palette[i], values: stacks[key] }));
+        // Stack values
+        const stacked = seqLabels.map((label, i) => {
+          let acc = 0; const items = [];
+          series.forEach((s, idx) => {
+            const y0 = acc; const y1 = acc + s.values[i];
+            items.push({ key: s.key, color: s.color, i, y0, y1, xLabel: label, value: s.values[i], isBottom: idx === 0, isTop: idx === series.length - 1 });
+            acc = y1;
+          });
+          const total = acc;
+          items.forEach(it => { it.total = total; });
+          return { label, items };
+        });
+
+        const { innerWidth, innerHeight } = updateScales();
+
+        const bandWidth = x0.bandwidth();
+        const groups = gBars.selectAll('g.bar-group').data(stacked, d=>d.label);
+        const groupsEnter = groups.enter().append('g').attr('class','bar-group');
+        groupsEnter.merge(groups).attr('transform', (d)=>`translate(${x0(d.label)},0)`);
+        groups.exit().remove();
+
+        // Helper to draw per-corner rounded rectangle path
+        const rCorner = 4;
+        const roundedPath = (x, yTop, w, h, isTop, isBottom) => {
+          const r = Math.min(rCorner, Math.max(0, Math.min(w, h) / 2));
+          const rTL = isTop ? r : 0, rTR = isTop ? r : 0, rBR = isBottom ? r : 0, rBL = isBottom ? r : 0;
+          const x0 = x, y0 = yTop, x1 = x + w, y1 = yTop + h;
+          return `M${x0 + rTL},${y0}`
+            + `H${x1 - rTR}`
+            + (rTR ? `Q${x1},${y0} ${x1},${y0 + rTR}` : `V${y0}`)
+            + `V${y1 - rBR}`
+            + (rBR ? `Q${x1},${y1} ${x1 - rBR},${y1}` : `H${x1}`)
+            + `H${x0 + rBL}`
+            + (rBL ? `Q${x0},${y1} ${x0},${y1 - rBL}` : `V${y1}`)
+            + `V${y0 + rTL}`
+            + (rTL ? `Q${x0},${y0} ${x0 + rTL},${y0}` : `H${x0}`)
+            + 'Z';
+        };
+
+        const bars = groupsEnter.merge(groups).selectAll('path.bar').data(d=>d.items, d=>d.key);
+        bars.enter().append('path').attr('class','bar')
+          .attr('d', (d)=> roundedPath(0, y(d.y1), bandWidth, Math.max(0.5, y(d.y0) - y(d.y1)), d.isTop, d.isBottom))
+          .attr('fill', (d)=>d.color)
+          .on('mouseenter', function(ev, d){
+            container.classList.add('hovering');
+            gBars.selectAll('path.bar').classed('ghost', (dd) => !(dd && dd.key === d.key));
+            const pct = d.total > 0 ? (d.value / d.total * 100) : 0;
+            tipInner.innerHTML = `
+              <div style="display:flex;align-items:center;gap:6px;margin-bottom:4px;">
+                <span class="swatch" style="background:${d.color}"></span>
+                <strong>${d.key}</strong>
+              </div>
+              <div><strong>Seq</strong> ${d.xLabel}</div>
+              <div><strong>Mem</strong> ${d.value.toFixed(1)} GB <span style="opacity:.7">(${pct.toFixed(0)}%)</span></div>
+              <div style="opacity:.7"><strong>Total</strong> ${d.total.toFixed(1)} GB</div>
+            `;
+            tip.style.opacity = '1';
+            const li = legendItems.querySelector(`.item[data-key="${d.key}"]`);
+            if (li) li.classList.add('hovered');
+            legendItems.querySelectorAll('.item').forEach(it => it.classList.toggle('ghost', it.getAttribute('data-key') !== d.key));
+          })
+          .on('mousemove', function(ev, d){
+            const [mx, my] = d3.pointer(ev, container);
+            const offsetX = 12, offsetY = 12;
+            const maxX = (container.clientWidth || 0) - (tip.offsetWidth + 6);
+            const maxY = (container.clientHeight || 0) - (tip.offsetHeight + 6);
+            const tx = Math.max(0, Math.min(mx + offsetX, maxX));
+            const ty = Math.max(0, Math.min(my + offsetY, maxY));
+            tip.style.transform = `translate(${Math.round(tx)}px, ${Math.round(ty)}px)`;
+          })
+          .on('mouseleave', function(){
+            tip.style.opacity='0';
+            tip.style.transform='translate(-9999px, -9999px)';
+            container.classList.remove('hovering');
+            gBars.selectAll('path.bar').classed('ghost', false).classed('highlight', false);
+            legendItems.querySelectorAll('.item').forEach(it => { it.classList.remove('hovered'); it.classList.remove('ghost'); });
+          })
+          .merge(bars)
+          .transition().duration(200)
+          .attr('d', (d)=> roundedPath(0, y(d.y1), bandWidth, Math.max(0.5, y(d.y0) - y(d.y1)), d.isTop, d.isBottom))
+          .attr('fill', (d)=>d.color);
+        bars.exit().remove();
+      }
+
+      function update(){ drawBars(); }
+
+      // Boot
+      update();
+      // controls already appended to footer; populate control groups
+      controls.appendChild(groupSize); controls.appendChild(groupRecomp);
+      selSize.addEventListener('change', (e)=>{ currentSize = e.target.value; update(); });
+      selRecomp.addEventListener('change', (e)=>{ currentMode = e.target.value; update(); });
+
+      const rerender = () => { update(); };
+      if (window.ResizeObserver) { const ro = new ResizeObserver(()=>rerender()); ro.observe(container); } else { window.addEventListener('resize', rerender); }
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
+
+
diff --git a/app/src/content/embeds/d3-benchmark.html b/app/src/content/embeds/d3-benchmark.html
new file mode 100644
index 0000000000000000000000000000000000000000..99b995dac556902cb083b35fb818571d3e19c374
--- /dev/null
+++ b/app/src/content/embeds/d3-benchmark.html
@@ -0,0 +1,434 @@
+<div class="d3-benchmark"></div>
+<style>
+  .d3-benchmark { position: relative; }
+  .d3-benchmark .controls {
+    display: flex;
+    align-items: center;
+    gap: 12px;
+    margin-bottom: 10px;
+  }
+  .d3-benchmark .controls label {
+    font-size: 12px;
+    color: var(--muted-color);
+  }
+  .d3-benchmark .controls select {
+    appearance: none;
+    -webkit-appearance: none;
+    -moz-appearance: none;
+    border: 1px solid var(--border-color);
+    border-radius: 8px;
+    padding: 6px 28px 6px 10px;
+    background-color: var(--surface-bg);
+    color: var(--text-color);
+    font-size: 13px;
+    line-height: 1.2;
+    background-image: url("data:image/svg+xml,%3Csvg width='12' height='8' viewBox='0 0 12 8' xmlns='http://www.w3.org/2000/svg'%3E%3Cpath d='M1.41 1.59L6 6.17l4.59-4.58L12 3 6 9 0 3z' fill='%23999'/%3E%3C/svg%3E");
+    background-repeat: no-repeat;
+    background-position: right 8px center;
+  }
+  .d3-benchmark .controls select:focus-visible {
+    outline: 2px solid var(--primary-color);
+    outline-offset: 2px;
+  }
+  .d3-benchmark .legend {
+    display: flex;
+    flex-direction: column;
+    align-items: flex-start;
+    gap: 6px;
+    margin: 8px 0 0 0;
+  }
+  .d3-benchmark .legend .legend-title {
+    font-size: 12px;
+    font-weight: 700;
+    color: var(--text-color);
+  }
+  .d3-benchmark .legend .items {
+    display: flex;
+    flex-wrap: wrap;
+    gap: 8px 14px;
+  }
+  .d3-benchmark .legend .item {
+    display: inline-flex;
+    align-items: center;
+    gap: 8px;
+    font-size: 12px;
+    color: var(--muted-color);
+    cursor: pointer;
+  }
+  .d3-benchmark .legend .swatch {
+    width: 14px;
+    height: 14px;
+    border-radius: 3px;
+    border: 1px solid var(--border-color);
+  }
+  .d3-benchmark .ghost { opacity: .25; }
+  .d3-benchmark .d3-tooltip {
+    position: absolute;
+    top: 0px;
+    left: 0px;
+    transform: translate(-9999px, -9999px);
+    pointer-events: none;
+    padding: 8px 10px;
+    border-radius: 8px;
+    font-size: 12px;
+    line-height: 1.35;
+    border: 1px solid var(--border-color);
+    background: var(--surface-bg);
+    color: var(--text-color);
+    box-shadow: 0 4px 24px rgba(0,0,0,.18);
+    opacity: 0;
+    transition: opacity .12s ease;
+    text-align: left;
+  }
+  .d3-benchmark .chart-card {
+    background: var(--surface-bg);
+    border: 1px solid var(--border-color);
+    border-radius: 10px;
+    padding: 8px;
+  }
+</style>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) {
+        s = document.createElement('script');
+        s.id = 'd3-cdn-script';
+        s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js';
+        document.head.appendChild(s);
+      }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-benchmark'))){
+        const cs = Array.from(document.querySelectorAll('.d3-benchmark')).filter(el => !(el.dataset && el.dataset.mounted==='true'));
+        container = cs[cs.length-1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted==='true') return; container.dataset.mounted='true'; }
+
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tip.appendChild(tipInner);
+        container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // header below chart
+      const header = document.createElement('div'); header.className = 'chart-header';
+
+      const makeLegend = (series, colorBySeries) => {
+        let legend = header.querySelector('.legend');
+        if (!legend) { legend = document.createElement('div'); legend.className = 'legend'; header.appendChild(legend); }
+        // Ensure title
+        let title = legend.querySelector('.legend-title');
+        if (!title) { title = document.createElement('div'); title.className = 'legend-title'; title.textContent = 'Legend'; legend.appendChild(title); }
+        // Ensure items container
+        let items = legend.querySelector('.items');
+        if (!items) { items = document.createElement('div'); items.className = 'items'; legend.appendChild(items); }
+        items.innerHTML = '';
+        series.forEach(name => {
+          const item = document.createElement('div'); item.className = 'item';
+          const sw = document.createElement('span'); sw.className = 'swatch'; sw.style.background = colorBySeries(name);
+          const txt = document.createElement('span'); txt.textContent = name;
+          item.appendChild(sw); item.appendChild(txt); items.appendChild(item);
+          item.addEventListener('mouseenter', () => { state.highlightModel = name; updateHighlight(); });
+          item.addEventListener('mouseleave', () => { state.highlightModel = null; updateHighlight(); });
+        });
+      };
+
+      // SVG scaffolding inside a card wrapper, then header appended after
+      const card = document.createElement('div'); card.className = 'chart-card'; container.appendChild(card);
+      container.appendChild(header);
+      const svg = d3.select(card).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+
+      // No controls (fixed scale mode)
+
+      // Public-first data loading with inline fallback
+      const fetchFirstAvailable = async (paths) => {
+        for (const p of paths) {
+          try {
+            const res = await fetch(p, { cache:'no-cache' });
+            if (!res.ok) throw new Error('HTTP '+res.status);
+            const text = await res.text();
+            // Try JSON first; if CSV, parse with d3.csvParse
+            try { return JSON.parse(text); } catch(e) {}
+            if (window.d3 && d3.csvParse) { return d3.csvParse(text); }
+          } catch (e) { /* keep trying */ }
+        }
+        return null;
+      };
+
+      // Inline fallback dataset (scores in % where applicable)
+      const inlineData = [
+        { benchmark:'MMLU',       model:'GPT-4o',      score: 88 },
+        { benchmark:'MMLU',       model:'Llama 3 70B', score: 80 },
+        { benchmark:'MMLU',       model:'Mixtral 8x7B',score: 73 },
+        { benchmark:'MMLU',       model:'Gemma 2 27B', score: 76 },
+        { benchmark:'GSM8K',      model:'GPT-4o',      score: 94 },
+        { benchmark:'GSM8K',      model:'Llama 3 70B', score: 83 },
+        { benchmark:'GSM8K',      model:'Mixtral 8x7B',score: 79 },
+        { benchmark:'GSM8K',      model:'Gemma 2 27B', score: 81 },
+        { benchmark:'HellaSwag',  model:'GPT-4o',      score: 95 },
+        { benchmark:'HellaSwag',  model:'Llama 3 70B', score: 89 },
+        { benchmark:'HellaSwag',  model:'Mixtral 8x7B',score: 86 },
+        { benchmark:'HellaSwag',  model:'Gemma 2 27B', score: 87 },
+        { benchmark:'TruthfulQA', model:'GPT-4o',      score: 64 },
+        { benchmark:'TruthfulQA', model:'Llama 3 70B', score: 56 },
+        { benchmark:'TruthfulQA', model:'Mixtral 8x7B',score: 51 },
+        { benchmark:'TruthfulQA', model:'Gemma 2 27B', score: 53 },
+        { benchmark:'ARC-C',      model:'GPT-4o',      score: 79 },
+        { benchmark:'ARC-C',      model:'Llama 3 70B', score: 72 },
+        { benchmark:'ARC-C',      model:'Mixtral 8x7B',score: 68 },
+        { benchmark:'ARC-C',      model:'Gemma 2 27B', score: 70 }
+      ];
+
+      const state = {
+        data: inlineData,
+        colorsByModel: null,
+        highlightModel: null,
+      };
+
+      const margin = { top: 12, right: 28, bottom: 24, left: 56 };
+      let width = 800, height = 360;
+      const x0 = d3.scaleBand().paddingInner(0.2).paddingOuter(0.05); // group: benchmark
+      const x1 = d3.scaleBand().padding(0.12); // series: model per benchmark
+      const y = d3.scaleLinear();
+      const xAxis = d3.axisBottom(x0).tickSizeOuter(0);
+      const yAxis = d3.axisLeft(y).ticks(6).tickSizeOuter(0);
+      const yTopPadding = 2; // avoid bars touching top at max
+
+      function getPrimaryColor(){
+        try { if (window.ColorPalettes && typeof window.ColorPalettes.getPrimary === 'function') return window.ColorPalettes.getPrimary(); } catch(e) {}
+        return getComputedStyle(document.documentElement).getPropertyValue('--primary-color') || '#6D4AFF';
+      }
+      function getCategoricalColors(n){
+        try { if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') return window.ColorPalettes.getColors('categorical', n); } catch(e) {}
+        // Fallback: generate hues around the primary color (simple fallback)
+        const base = getPrimaryColor();
+        const colors = [];
+        for (let i=0;i<n;i++) {
+          const hue = Math.round((360/n)*i);
+          colors.push(`hsl(${hue}, 60%, 55%)`);
+        }
+        return colors;
+      }
+
+      function computeSeriesColors(models){
+        const palette = getCategoricalColors(models.length);
+        const map = new Map(models.map((m, i) => [m, palette[i % palette.length]]));
+        return (model) => map.get(model) || getPrimaryColor();
+      }
+
+      function getModels(data){
+        return Array.from(new Set(data.map(d => d.model)));
+      }
+      function getBenchmarks(data){
+        return Array.from(new Set(data.map(d => d.benchmark)));
+      }
+
+      function updateSize(){
+        width = container.clientWidth || 800;
+        height = Math.max(240, Math.round(width / 3.4));
+        svg.attr('width', width).attr('height', height);
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        return { innerWidth: width - margin.left - margin.right, innerHeight: height - margin.top - margin.bottom };
+      }
+
+      function showTip(html, x, y){
+        tip.style.transform = `translate(${x + 12}px, ${y + 12}px)`;
+        tip.style.opacity = '1';
+        const inner = tip.querySelector('.d3-tooltip__inner') || tip;
+        inner.innerHTML = html;
+      }
+      function hideTip(){
+        tip.style.opacity = '0';
+        tip.style.transform = 'translate(-9999px, -9999px)';
+      }
+
+      function updateHighlight(){
+        const model = state.highlightModel;
+        const bars = gRoot.selectAll('rect.bar');
+        const labels = gRoot.selectAll('text.value');
+        if (model) {
+          bars.classed('ghost', d => d.model !== model);
+          labels.classed('ghost', d => d.model !== model);
+          const items = container.querySelectorAll('.legend .item');
+          items.forEach((el) => {
+            const name = el.textContent.trim();
+            if (name !== model) el.classList.add('ghost'); else el.classList.remove('ghost');
+          });
+        } else {
+          bars.classed('ghost', false);
+          labels.classed('ghost', false);
+          container.querySelectorAll('.legend .item').forEach(el => el.classList.remove('ghost'));
+        }
+      }
+
+      function render(){
+        const { innerWidth, innerHeight } = updateSize();
+        const models = getModels(state.data);
+        if (!state.colorsByModel) state.colorsByModel = computeSeriesColors(models);
+        makeLegend(models, state.colorsByModel);
+
+        x0.domain(getBenchmarks(state.data)).range([0, innerWidth]);
+        x1.domain(models).range([0, x0.bandwidth()]);
+
+        const yMaxRaw = 100;
+        const yMax = yMaxRaw + yTopPadding;
+        y.domain([0, yMax]).range([innerHeight, 0]).nice();
+
+        // Axes (standardized colors)
+        gRoot
+          .selectAll('.axis-x')
+          .data([0])
+          .join('g')
+          .attr('class','axis-x')
+          .attr('transform',`translate(0,${innerHeight})`)
+          .call(xAxis)
+          .call(g => {
+            g.selectAll('path, line').attr('stroke', 'var(--axis-color)');
+            g.selectAll('text').attr('fill', 'var(--tick-color)').style('font-size','12px');
+          });
+        gRoot
+          .selectAll('.axis-y')
+          .data([0])
+          .join('g')
+          .attr('class','axis-y')
+          .call(yAxis)
+          .call(g => {
+            g.selectAll('path, line').attr('stroke', 'var(--axis-color)');
+            g.selectAll('text').attr('fill', 'var(--tick-color)').style('font-size','12px');
+          });
+
+        // Gridlines (y) standardized color
+        gRoot
+          .selectAll('.grid-y')
+          .data([0])
+          .join('g')
+          .attr('class','grid-y')
+          .call(d3.axisLeft(y).ticks(6).tickSize(-innerWidth).tickFormat(''))
+          .call(g => g.select('.domain').remove())
+          .call(g => g.selectAll('.tick line').attr('stroke','var(--grid-color)').attr('stroke-opacity',1))
+          .call(g => g.selectAll('.tick').filter((d, i, nodes) => i === nodes.length - 1).select('line').attr('stroke-opacity', 0));
+
+        // Groups per benchmark
+        const groups = gRoot.selectAll('.group').data(getBenchmarks(state.data), d => d);
+        const groupsEnter = groups.enter().append('g').attr('class','group');
+        groupsEnter.merge(groups).attr('transform', d => `translate(${x0(d)},0)`);
+        groups.exit().remove();
+
+        // Bars per model
+        const nested = d3.group(state.data, d => d.benchmark);
+        groupsEnter.each(function(bench){ d3.select(this).selectAll('rect.bar').data([]).join('rect'); });
+        const allGroups = gRoot.selectAll('.group');
+        allGroups.each(function(bench){
+          const dataForBench = nested.get(bench) || [];
+          const bars = d3.select(this).selectAll('rect.bar').data(models.map(m => ({ bench, model:m, score:(dataForBench.find(dd=>dd.model===m)||{score:0}).score })) , d => d.model);
+          bars.join(
+            enter => enter.append('rect')
+              .attr('class','bar')
+              .attr('x', d => x1(d.model))
+              .attr('y', innerHeight)
+              .attr('width', x1.bandwidth())
+              .attr('height', 0)
+              .attr('fill', d => state.colorsByModel(d.model))
+              .on('mouseenter', (event, d) => { state.highlightModel = d.model; updateHighlight(); })
+              .on('mousemove', (event, d) => {
+                const [mx, my] = d3.pointer(event, container);
+                showTip(`<strong>${d.model}</strong><br/>${d.bench}: <strong>${d.score}</strong>`, mx, my);
+              })
+              .on('mouseleave', () => { hideTip(); state.highlightModel = null; updateHighlight(); })
+              .transition().duration(160)
+              .attr('y', d => y(d.score))
+              .attr('height', d => Math.max(0, innerHeight - y(d.score))),
+            update => update
+              .on('mouseenter', (event, d) => { state.highlightModel = d.model; updateHighlight(); })
+              .on('mousemove', (event, d) => {
+                const [mx, my] = d3.pointer(event, container);
+                showTip(`<strong>${d.model}</strong><br/>${d.bench}: <strong>${d.score}</strong>`, mx, my);
+              })
+              .on('mouseleave', () => { hideTip(); state.highlightModel = null; updateHighlight(); })
+              .transition().duration(160)
+              .attr('x', d => x1(d.model))
+              .attr('y', d => y(d.score))
+              .attr('width', x1.bandwidth())
+              .attr('height', d => Math.max(0, innerHeight - y(d.score)))
+              .attr('fill', d => state.colorsByModel(d.model)),
+            exit => exit.transition().duration(120).attr('y', innerHeight).attr('height', 0).remove()
+          );
+
+          // Value labels centered above bars (small, darker)
+          const labels = d3.select(this).selectAll('text.value').data(models.map(m => ({ bench, model:m, score:(dataForBench.find(dd=>dd.model===m)||{score:0}).score })) , d => d.model);
+          labels.join(
+            enter => enter.append('text')
+              .attr('class','value')
+              .attr('x', d => x1(d.model) + x1.bandwidth()/2)
+              .attr('y', d => y(d.score) - 4)
+              .attr('text-anchor','middle')
+              .attr('fill','var(--text-color)')
+              .attr('opacity',0.9)
+              .attr('font-size',10)
+              .text(d => d.score),
+            update => update
+              .transition().duration(160)
+              .attr('x', d => x1(d.model) + x1.bandwidth()/2)
+              .attr('y', d => y(d.score) - 4)
+              .text(d => d.score),
+            exit => exit.remove()
+          );
+        });
+
+        // Axis labels
+        gRoot.selectAll('.y-label').data([0]).join('text').attr('class','y-label')
+          .attr('transform', `rotate(-90)`) 
+          .attr('x', -innerHeight / 2)
+          .attr('y', -margin.left + 24)
+          .attr('text-anchor','middle')
+          .attr('fill','var(--text-color)')
+          .attr('font-size',12)
+          .attr('font-weight',700)
+          .text('score');
+      }
+
+      // Initial render + resize handling
+      render();
+      const rerender = () => render();
+      if (window.ResizeObserver) { const ro = new ResizeObserver(() => rerender()); ro.observe(container); }
+      else { window.addEventListener('resize', rerender); }
+
+      // Attempt to load external data (public-first). Expect either JSON array with {benchmark, model, score}
+      (async () => {
+        const maybe = await fetchFirstAvailable([
+          '/data/llm_benchmarks.json',
+          './assets/data/llm_benchmarks.json',
+          '../assets/data/llm_benchmarks.json'
+        ]);
+        if (Array.isArray(maybe) && maybe.length && maybe[0].benchmark && maybe[0].model && (typeof maybe[0].score === 'number')) {
+          state.data = maybe;
+          state.colorsByModel = null; // recompute in case of different model set
+          render();
+        } else if (maybe && maybe.columns) {
+          // CSV parsed via d3.csvParse -> convert fields
+          const parsed = maybe.map(r => ({ benchmark: r.benchmark, model: r.model, score: +r.score }));
+          if (parsed.length) { state.data = parsed; state.colorsByModel = null; render(); }
+        }
+      })().catch(() => {
+        // Graceful failure: inline fallback already rendered
+      });
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); }
+    else { ensureD3(bootstrap); }
+  })();
+</script>
+
+
diff --git a/app/src/content/embeds/d3-confusion-matrix.html b/app/src/content/embeds/d3-confusion-matrix.html
new file mode 100644
index 0000000000000000000000000000000000000000..944807d8cadc0e37db2bd6d04b48fb9f2bcb1b6e
--- /dev/null
+++ b/app/src/content/embeds/d3-confusion-matrix.html
@@ -0,0 +1,516 @@
+<div class="d3-confusion-matrix"  ></div>
+<style>
+  .d3-confusion-matrix {
+    position: relative;
+  }
+  .d3-confusion-matrix .panels {
+    display: flex;
+    flex-wrap: wrap;
+    gap: 16px;
+    margin-bottom: 4px;
+  }
+  .d3-confusion-matrix .panel {
+    flex: 1 1 320px;
+    min-width: 280px;
+  }
+  .d3-confusion-matrix .panel__title {
+    color: var(--text-color);
+    font-size: 12px;
+    line-height: 1.35;
+    margin: 0 0 6px 0;
+    font-weight: 600;
+  }
+  .d3-confusion-matrix .axis-label {
+    fill: var(--text-color);
+    font-size: 11px;
+    font-weight: 700;
+  }
+  .d3-confusion-matrix .cell-border {
+    stroke: var(--border-color);
+    stroke-width: 1px;
+    fill: none;
+  }
+  .d3-confusion-matrix .cell-text {
+    fill: var(--muted-color);
+    font-size: 11px;
+    pointer-events: none;
+  }
+  .d3-confusion-matrix .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+</style>
+<script>
+  (() => {
+    // Load D3 from CDN once
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) {
+        s = document.createElement('script');
+        s.id = 'd3-cdn-script';
+        s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js';
+        document.head.appendChild(s);
+      }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-confusion-matrix'))){
+        const cs = Array.from(document.querySelectorAll('.d3-confusion-matrix')).filter(el => !(el.dataset && el.dataset.mounted === 'true'));
+        container = cs[cs.length - 1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) {
+        if (container.dataset.mounted === 'true') return;
+        container.dataset.mounted = 'true';
+      }
+
+      // Tooltip (HTML, single instance inside container)
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip');
+      let tipInner;
+      if (!tip) {
+        tip = document.createElement('div');
+        tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position: 'absolute',
+          top: '0px',
+          left: '0px',
+          transform: 'translate(-9999px, -9999px)',
+          pointerEvents: 'none',
+          padding: '8px 10px',
+          borderRadius: '8px',
+          fontSize: '12px',
+          lineHeight: '1.35',
+          border: '1px solid var(--border-color)',
+          background: 'var(--surface-bg)',
+          color: 'var(--text-color)',
+          boxShadow: '0 4px 24px rgba(0,0,0,.18)',
+          opacity: '0',
+          transition: 'opacity .12s ease'
+        });
+        tipInner = document.createElement('div');
+        tipInner.className = 'd3-tooltip__inner';
+        tipInner.style.textAlign = 'left';
+        tip.appendChild(tipInner);
+        container.appendChild(tip);
+      } else {
+        tipInner = tip.querySelector('.d3-tooltip__inner') || tip;
+      }
+
+      // Panels container (two side-by-side matrices)
+      const panels = document.createElement('div');
+      panels.className = 'panels';
+      const panelA = document.createElement('div');
+      panelA.className = 'panel';
+      const titleA = document.createElement('div'); titleA.className = 'panel__title'; titleA.textContent = 'Baseline (row-normalized %)';
+      panelA.appendChild(titleA);
+      const mountA = document.createElement('div'); panelA.appendChild(mountA);
+      const panelB = document.createElement('div');
+      panelB.className = 'panel';
+      const titleB = document.createElement('div'); titleB.className = 'panel__title'; titleB.textContent = 'Delta (Improved − Baseline, pp)';
+      panelB.appendChild(titleB);
+      const mountB = document.createElement('div'); panelB.appendChild(mountB);
+      panels.appendChild(panelA);
+      panels.appendChild(panelB);
+      container.appendChild(panels);
+
+      // SVG scaffolding
+      const cardA = document.createElement('div'); cardA.className = 'chart-card'; mountA.appendChild(cardA);
+      const svgA = d3.select(cardA).append('svg').attr('width', '100%').style('display', 'block');
+      const gRootA = svgA.append('g');
+      const gCellsA = gRootA.append('g');
+      const gAxesA = gRootA.append('g');
+      const cardB = document.createElement('div'); cardB.className = 'chart-card'; mountB.appendChild(cardB);
+      const svgB = d3.select(cardB).append('svg').attr('width', '100%').style('display', 'block');
+      const gRootB = svgB.append('g');
+      const gCellsB = gRootB.append('g');
+      const gAxesB = gRootB.append('g');
+
+      // Demo data (two distinct 10x10 confusion matrices: Baseline vs Improved)
+      // Rows: actual, Columns: predicted
+      const classes = ['0','1','2','3','4','5','6','7','8','9'];
+      const matrixA = [
+        [90,  2,  1,  0,  0,  0,  1,  0,  5,  1],
+        [ 3, 85,  5,  1,  0,  1,  2,  1,  1,  1],
+        [ 1,  6, 70, 10,  4,  4,  1,  1,  1,  2],
+        [ 0,  1,  8, 65, 10, 10,  2,  1,  1,  2],
+        [ 0,  0,  2,  6, 83,  3,  1,  1,  3,  1],
+        [ 0,  1,  2, 12,  4, 70,  5,  2,  2,  2],
+        [ 1,  2,  1,  0,  1,  2, 88,  1,  3,  1],
+        [ 0,  1,  1,  1,  1,  1,  2, 90,  1,  2],
+        [ 6,  2,  2,  4,  6,  3,  3,  2, 70,  2],
+        [ 1,  1,  1,  1,  2,  1,  1,  2,  1, 89]
+      ];
+      const matrixB = [
+        [94,  1,  0,  0,  0,  0,  1,  0,  3,  1],
+        [ 2, 90,  3,  1,  0,  0,  1,  1,  1,  1],
+        [ 1,  4, 78,  7,  3,  3,  1,  1,  1,  1],
+        [ 0,  1,  5, 74,  7,  8,  1,  1,  1,  2],
+        [ 0,  0,  1,  4, 88,  2,  1,  1,  2,  1],
+        [ 0,  1,  1,  9,  3, 78,  3,  1,  2,  2],
+        [ 1,  1,  1,  0,  1,  1, 91,  1,  2,  1],
+        [ 0,  1,  1,  1,  1,  1,  1, 92,  1,  1],
+        [ 4,  1,  1,  3,  4,  2,  2,  2, 79,  2],
+        [ 1,  1,  1,  1,  2,  1,  1,  1,  1, 90]
+      ];
+
+      // Colors: sequential palette via window.ColorPalettes with graceful fallback
+      const getSequentialColors = (count) => {
+        try {
+          if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+            return window.ColorPalettes.getColors('sequential', count);
+          }
+        } catch (_) {}
+        // Fallback: generate a monochrome scale using the primary color with varying opacity
+        const arr = [];
+        for (let i = 0; i < count; i++) arr.push('var(--primary-color)');
+        return arr;
+      };
+
+      const palette = getSequentialColors(13);
+      const getDivergingColors = (count) => {
+        try {
+          if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+            return window.ColorPalettes.getColors('diverging', count);
+          }
+        } catch (_) {}
+        const steps = Math.max(3, count|0);
+        const arr = [];
+        for (let i = 0; i < steps; i++) {
+          const t = i / (steps - 1);
+          const pct = Math.round(t * 100);
+          arr.push(`color-mix(in srgb, #D64545 ${100-pct}%, #3A7BD5 ${pct}%)`);
+        }
+        return arr;
+      };
+
+      let width = 800;
+      let height = 480;
+      const margin = { top: 36, right: 24, bottom: 26, left: 56 };
+
+      function updateSize() {
+        const isDark = document.documentElement.getAttribute('data-theme') === 'dark';
+        width = container.clientWidth || 800;
+        const gap = 16; // matches CSS .panels gap
+        const minPanel = 320;
+        const nCols = (width >= (minPanel * 2 + gap)) ? 2 : 1;
+        const panelWidth = nCols === 2 ? Math.max(minPanel, Math.floor((width - gap) / 2)) : Math.max(minPanel, width);
+        const base = Math.max(minPanel, Math.round(panelWidth * 0.92));
+        height = base;
+        // Responsive SVG: width 100%, height auto, preserve aspect via viewBox
+        svgA
+          .attr('viewBox', `0 0 ${panelWidth} ${height}`)
+          .attr('preserveAspectRatio', 'xMidYMid meet')
+          .style('width', '100%')
+          .style('height', 'auto');
+        svgB
+          .attr('viewBox', `0 0 ${panelWidth} ${height}`)
+          .attr('preserveAspectRatio', 'xMidYMid meet')
+          .style('width', '100%')
+          .style('height', 'auto');
+        gRootA.attr('transform', `translate(${margin.left},${margin.top})`);
+        gRootB.attr('transform', `translate(${margin.left},${margin.top})`);
+        const innerWidth = panelWidth - margin.left - margin.right;
+        const innerHeight = height - margin.top - margin.bottom;
+        return { innerWidth, innerHeight, isDark };
+      }
+
+      function computeValues(normalization, matrix) {
+        const n = classes.length;
+        const totalsByRow = matrix.map(row => row.reduce((a, b) => a + b, 0));
+        const flat = [];
+        let minV = Infinity, maxV = -Infinity;
+        for (let r = 0; r < n; r++) {
+          for (let c = 0; c < n; c++) {
+            const count = matrix[r][c];
+            const value = normalization === 'row' ? (totalsByRow[r] ? count / totalsByRow[r] : 0) : count;
+            if (value < minV) minV = value;
+            if (value > maxV) maxV = value;
+            flat.push({ r, c, count, value });
+          }
+        }
+        return { data: flat, minV, maxV };
+      }
+
+      function getColorScale(values, minV, maxV) {
+        // If ColorPalettes is available, use quantiles to enhance visual variation across the distribution
+        const hasPalette = !(palette.length === 0);
+        if (hasPalette && (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function')) {
+          const scale = d3.scaleQuantile().domain(values).range(palette);
+          return (v) => scale(v);
+        }
+        // Fallback: primary color with opacity mapped to normalized value
+        const norm = d3.scaleLinear().domain([minV, maxV]).range([0.08, 0.9]).clamp(true);
+        return (v) => `color-mix(in oklab, var(--primary-color) ${Math.round(norm(v) * 100)}%, var(--surface-bg))`;
+      }
+
+      // (no local contrast function — use ColorPalettes.getTextStyleForBackground)
+
+      // Compute a fixed readable text color from a CSS rgb()/rgba() string
+      function chooseFixedReadableTextOnBg(bgCss){
+        try {
+          const m = String(bgCss||'').match(/rgba?\(([^)]+)\)/);
+          if (!m) return '#0e1116';
+          const parts = m[1].split(',').map(s => parseFloat(s.trim()));
+          const [r, g, b] = parts;
+          // sRGB → relative luminance
+          const srgb = [r, g, b].map(v => Math.max(0, Math.min(255, v)) / 255);
+          const linear = srgb.map(c => (c <= 0.03928 ? c/12.92 : Math.pow((c + 0.055)/1.055, 2.4)));
+          const L = 0.2126*linear[0] + 0.7152*linear[1] + 0.0722*linear[2];
+          // Threshold ~ 0.5 for readability; darker BG → white text, else near-black
+          return L < 0.5 ? '#ffffff' : '#0e1116';
+        } catch(_) { return '#0e1116'; }
+      }
+
+      function render() {
+        const { innerWidth, innerHeight } = updateSize();
+        const n = classes.length;
+        const gridSize = Math.min(innerWidth, innerHeight);
+        const cellSize = gridSize / n;
+
+        const x = d3.scaleBand().domain(d3.range(n)).range([0, gridSize]).paddingInner(0.06);
+        const y = d3.scaleBand().domain(d3.range(n)).range([0, gridSize]).paddingInner(0.06);
+
+        // Panel A: Baseline (row-normalized)
+        const dataA = computeValues('row', matrixA);
+        const colorA = getColorScale(dataA.data.map(d => d.value), dataA.minV, dataA.maxV);
+
+        gCellsA.selectAll('rect.cell-bg')
+          .data([0])
+          .join('rect')
+          .attr('class', 'cell-bg')
+          .attr('x', 0)
+          .attr('y', 0)
+          .attr('width', gridSize)
+          .attr('height', gridSize)
+          .attr('fill', 'none')
+          .attr('stroke', 'var(--border-color)')
+          .attr('stroke-width', 1);
+
+        const cellsA = gCellsA.selectAll('g.cell')
+          .data(dataA.data, d => `${d.r}-${d.c}-A`);
+
+        const cellsEnterA = cellsA.enter()
+          .append('g')
+          .attr('class', 'cell');
+
+        cellsEnterA.append('rect')
+          .attr('rx', 2)
+          .attr('ry', 2)
+          .on('mousemove', (event, d) => {
+            const [px, py] = d3.pointer(event, container);
+            tipInner.innerHTML = `<strong>${classes[d.r]}</strong> → <strong>${classes[d.c]}</strong><br/>${(d.value * 100).toFixed(1)}% (${d.count})`;
+            tip.style.transform = `translate(${px + 10}px, ${py + 10}px)`;
+            tip.style.opacity = '1';
+          })
+          .on('mouseleave', () => {
+            tip.style.opacity = '0';
+          });
+
+        cellsEnterA.append('text')
+          .attr('class', 'cell-text')
+          .attr('text-anchor', 'middle')
+          .attr('dominant-baseline', 'middle');
+
+        const cellsMergedA = cellsEnterA.merge(cellsA);
+
+        cellsMergedA.select('rect')
+          .attr('x', d => x(d.c))
+          .attr('y', d => y(d.r))
+          .attr('width', Math.max(1, x.bandwidth()))
+          .attr('height', Math.max(1, y.bandwidth()))
+          .attr('fill', d => colorA(d.value));
+
+        cellsMergedA.select('text')
+          .attr('x', d => x(d.c) + x.bandwidth() / 2)
+          .attr('y', d => y(d.r) + y.bandwidth() / 2)
+          .text(d => `${Math.round(d.value * 100)}`)
+          .style('fill', function(d){
+            try {
+              const rect = this && this.parentNode ? this.parentNode.querySelector('rect') : null;
+              const bg = rect ? getComputedStyle(rect).fill : colorA(d.value);
+              return chooseFixedReadableTextOnBg(bg);
+            } catch (_) {
+              return '#0e1116';
+            }
+          });
+
+        cellsA.exit().remove();
+
+        gAxesA.selectAll('*').remove();
+
+        gAxesA.append('g')
+          .selectAll('text')
+          .data(classes)
+          .join('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('x', (_, i) => x(i) + x.bandwidth() / 2)
+          .attr('y', -8)
+          .text(d => d);
+
+        gAxesA.append('g')
+          .selectAll('text')
+          .data(classes)
+          .join('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'end')
+          .attr('x', -8)
+          .attr('y', (_, i) => y(i) + y.bandwidth() / 2)
+          .attr('dominant-baseline', 'middle')
+          .text(d => d);
+
+        gAxesA.append('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('x', gridSize / 2)
+          .attr('y', innerHeight + 20)
+          .text('Predicted');
+
+        gAxesA.append('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('transform', `translate(${-40}, ${gridSize / 2}) rotate(-90)`)
+          .text('Actual');
+
+        // Panel B: Delta (Improved − Baseline), row-normalized differences in percentage points
+        const dataB = computeValues('row', matrixB);
+        const diverging = getDivergingColors(13);
+        // Build delta values aligned to A's ordering
+        const mapA = new Map(dataA.data.map(d => [d.r + '-' + d.c, d.value]));
+        const delta = dataB.data.map(d => ({ r: d.r, c: d.c, count: d.count, value: (d.value - (mapA.get(d.r + '-' + d.c) || 0)) }));
+        // Symmetric domain around 0 (in proportions), express later as pp in labels
+        const maxAbsDelta = Math.max(0.01, d3.max(delta, d => Math.abs(d.value)) || 0.01);
+        const colorB = d3.scaleQuantize().domain([-maxAbsDelta, maxAbsDelta]).range(diverging);
+
+        gCellsB.selectAll('rect.cell-bg')
+          .data([0])
+          .join('rect')
+          .attr('class', 'cell-bg')
+          .attr('x', 0)
+          .attr('y', 0)
+          .attr('width', gridSize)
+          .attr('height', gridSize)
+          .attr('fill', 'none')
+          .attr('stroke', 'var(--border-color)')
+          .attr('stroke-width', 1);
+
+        const cellsB = gCellsB.selectAll('g.cell')
+          .data(dataB.data, d => `${d.r}-${d.c}-B`);
+
+        const cellsEnterB = cellsB.enter()
+          .append('g')
+          .attr('class', 'cell');
+
+        cellsEnterB.append('rect')
+          .attr('rx', 2)
+          .attr('ry', 2)
+          .on('mousemove', (event, d) => {
+            const [px, py] = d3.pointer(event, container);
+            const a = dataA.data.find(x => x.r===d.r && x.c===d.c);
+            const b = dataB.data.find(x => x.r===d.r && x.c===d.c);
+            const dv = ((b ? b.value : 0) - (a ? a.value : 0)) * 100;
+            tipInner.innerHTML = `<strong>${classes[d.r]}</strong> → <strong>${classes[d.c]}</strong>` +
+              `<br/>baseline ${(a ? a.value*100 : 0).toFixed(1)}%` +
+              `<br/>improved ${(b ? b.value*100 : 0).toFixed(1)}%` +
+              `<br/>delta ${dv.toFixed(1)} pp`;
+            tip.style.transform = `translate(${px + 10}px, ${py + 10}px)`;
+            tip.style.opacity = '1';
+          })
+          .on('mouseleave', () => {
+            tip.style.opacity = '0';
+          });
+
+        cellsEnterB.append('text')
+          .attr('class', 'cell-text')
+          .attr('text-anchor', 'middle')
+          .attr('dominant-baseline', 'middle');
+
+        const cellsMergedB = cellsEnterB.merge(cellsB);
+
+        cellsMergedB.select('rect')
+          .attr('x', d => x(d.c))
+          .attr('y', d => y(d.r))
+          .attr('width', Math.max(1, x.bandwidth()))
+          .attr('height', Math.max(1, y.bandwidth()))
+          .attr('fill', d => colorB(delta.find(x => x.r===d.r && x.c===d.c).value));
+
+        cellsMergedB.select('text')
+          .attr('x', d => x(d.c) + x.bandwidth() / 2)
+          .attr('y', d => y(d.r) + y.bandwidth() / 2)
+          .text(d => {
+            const dv = delta.find(x => x.r===d.r && x.c===d.c).value; return `${Math.round(dv * 100)}`;
+          })
+          .style('fill', function(d){
+            try {
+              const rect = this && this.parentNode ? this.parentNode.querySelector('rect') : null;
+              const dv = delta.find(x => x.r===d.r && x.c===d.c).value;
+              const bg = rect ? getComputedStyle(rect).fill : colorB(dv);
+              return chooseFixedReadableTextOnBg(bg);
+            } catch (_) {
+              return '#0e1116';
+            }
+          });
+
+        cellsB.exit().remove();
+
+        gAxesB.selectAll('*').remove();
+
+        gAxesB.append('g')
+          .selectAll('text')
+          .data(classes)
+          .join('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('x', (_, i) => x(i) + x.bandwidth() / 2)
+          .attr('y', -8)
+          .text(d => d);
+
+        gAxesB.append('g')
+          .selectAll('text')
+          .data(classes)
+          .join('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'end')
+          .attr('x', -8)
+          .attr('y', (_, i) => y(i) + y.bandwidth() / 2)
+          .attr('dominant-baseline', 'middle')
+          .text(d => d);
+
+        gAxesB.append('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('x', gridSize / 2)
+          .attr('y', innerHeight + 20)
+          .text('Predicted');
+
+        gAxesB.append('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('transform', `translate(${-40}, ${gridSize / 2}) rotate(-90)`)
+          .text('Actual');
+      }
+
+      // Initial render + resize handling
+      render();
+      const rerender = () => render();
+      if (window.ResizeObserver) {
+        const ro = new ResizeObserver(() => rerender());
+        ro.observe(container);
+      } else {
+        window.addEventListener('resize', rerender);
+      }
+    };
+
+    if (document.readyState === 'loading') {
+      document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true });
+    } else {
+      ensureD3(bootstrap);
+    }
+  })();
+</script>
+
+
diff --git a/app/src/content/embeds/d3-evals-after-fix.html b/app/src/content/embeds/d3-evals-after-fix.html
new file mode 100644
index 0000000000000000000000000000000000000000..529f311c6a592a5a7711077ad26c994fedfec681
--- /dev/null
+++ b/app/src/content/embeds/d3-evals-after-fix.html
@@ -0,0 +1,400 @@
+<div class="d3-evals-after-fix"></div>
+<style>
+  .d3-evals-after-fix { position: relative; }
+  .d3-evals-after-fix .controls {
+    margin-top: 0;
+    display: flex;
+    gap: 16px;
+    align-items: center;
+    justify-content: flex-end;
+    width: auto;
+    flex-wrap: wrap;
+  }
+  .d3-evals-after-fix .controls label {
+    font-size: 12px;
+    color: var(--text-color);
+    display: flex;
+    align-items: center;
+    gap: 6px;
+    white-space: nowrap;
+    font-weight: 700;
+  }
+  .d3-evals-after-fix .controls select {
+    font-size: 12px;
+    padding: 8px 28px 8px 10px;
+    border: 1px solid var(--border-color);
+    border-radius: 8px;
+    background-color: var(--surface-bg);
+    color: var(--text-color);
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%230f1115' stroke-width='2' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+    background-repeat: no-repeat; background-position: right 8px center; background-size: 12px;
+    -webkit-appearance: none; appearance: none; cursor: pointer; transition: border-color .15s ease, box-shadow .15s ease;
+  }
+  [data-theme="dark"] .d3-evals-after-fix .controls select {
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%23ffffff' stroke-width='2' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+  }
+  .d3-evals-after-fix .controls select:hover { border-color: var(--primary-color); }
+  .d3-evals-after-fix .controls select:focus { border-color: var(--primary-color); box-shadow: 0 0 0 3px rgba(232,137,171,.25); outline: none; }
+  .d3-evals-after-fix .axis-label { fill: var(--text-color); font-size: 12px; font-weight: 700; }
+  .d3-evals-after-fix .axes path, .d3-evals-after-fix .axes line { stroke: var(--axis-color); }
+  .d3-evals-after-fix .axes text { fill: var(--tick-color); }
+  .d3-evals-after-fix .grid line { stroke: var(--grid-color); }
+  .d3-evals-after-fix .legend { font-size: 12px; color: var(--text-color);padding-left: 6px; }
+  .d3-evals-after-fix .legend .items { display:flex; flex-wrap:wrap; gap:8px 12px; align-items:center; }
+  .d3-evals-after-fix .legend .item { display:flex; align-items:center; gap:6px; white-space:nowrap; }
+  .d3-evals-after-fix .legend .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; }
+  /* Ghosting on hover */
+  .d3-evals-after-fix.hovering .legend-bottom .item.ghost { opacity: .35; }
+  .d3-evals-after-fix.hovering .lines path.ghost { opacity: .25; }
+  .d3-evals-after-fix.hovering .points circle.ghost { opacity: .25; }
+  .d3-evals-after-fix.hovering .areas path.ghost { opacity: .08; }
+  .d3-evals-after-fix .chart-header { display:flex; align-items:center; justify-content:space-between; gap:12px; margin: 0 0 8px 0; flex-wrap: wrap; }
+  .d3-evals-after-fix .legend-bottom { display:flex; align-items:center; justify-content:flex-start; font-size:12px; color: var(--text-color); }
+  .d3-evals-after-fix .legend-bottom .items { display:flex; flex-wrap:wrap; gap:8px 14px; }
+  .d3-evals-after-fix .legend-bottom .item { display:inline-flex; align-items:center; gap:6px; white-space:nowrap; }
+  .d3-evals-after-fix .legend-bottom .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; }
+  .d3-evals-after-fix .lines path.active { stroke-width: 3; }
+  /* Layout tweaks: stack label above select, add legend title above items */
+  .d3-evals-after-fix .controls .control-group {
+    display: flex;
+    flex-direction: column;
+    align-items: flex-start;
+    gap: 6px;
+  }
+  .d3-evals-after-fix .legend-bottom {
+    flex-direction: column;
+    align-items: flex-start;
+    gap: 6px;
+  }
+  .d3-evals-after-fix .legend-bottom .legend-title {
+    font-size: 12px;
+    font-weight: 700;
+    color: var(--text-color);
+  }
+  /* Tooltip styling aligned with filters-quad */
+  .d3-evals-after-fix .d3-tooltip { z-index: var(--z-elevated); backdrop-filter: saturate(1.12) blur(8px); }
+  .d3-evals-after-fix .d3-tooltip__inner { display:flex; flex-direction:column; gap:6px; min-width: 220px; }
+  .d3-evals-after-fix .d3-tooltip__inner > div:first-child { font-weight: 800; letter-spacing: 0.1px; margin-bottom: 0; }
+  .d3-evals-after-fix .d3-tooltip__inner > div:nth-child(2) { font-size: 11px; color: var(--muted-color); display: block; margin-top: -4px; margin-bottom: 2px; letter-spacing: 0.1px; }
+  .d3-evals-after-fix .d3-tooltip__inner > div:nth-child(n+3) { padding-top: 6px; border-top: 1px solid var(--border-color); }
+  .d3-evals-after-fix .d3-tooltip__color-dot { display:inline-block; width: 12px; height: 12px; border-radius: 3px; border: 1px solid var(--border-color); }
+  /* Chart card only around the SVG */
+  .d3-evals-after-fix .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+  /* Place header below chart and align start */
+  .d3-evals-after-fix .chart-header { display:flex; align-items:flex-start; justify-content:flex-start; gap:12px; margin: 8px 0 0 0; flex-wrap: wrap; }
+</style>
+<script>
+  (() => {
+    // Pretty label mapping for metric keys
+    const prettyMetricLabel = (key) => {
+      if (!key) return '';
+      const table = {
+        'hellaswag': 'HellaSwag',
+        'mmlu': 'MMLU',
+        'arc': 'ARC',
+        'truthfulqa': 'TruthfulQA',
+        'gsm8k': 'GSM8K',
+        'winogrande': 'WinoGrande',
+        'openbookqa': 'OpenBookQA',
+        'piqa': 'PIQA',
+        'race': 'RACE',
+        'boolq': 'BoolQ',
+        'cb': 'CB',
+        'copa': 'COPA',
+        'multirc': 'MultiRC',
+        'record': 'ReCoRD',
+        'rte': 'RTE',
+        'wic': 'WiC',
+        'wsc': 'WSC'
+      };
+      if (table[key]) return table[key];
+      const cleaned = String(key).replace(/[_-]+/g, ' ').trim();
+      return cleaned.split(/\s+/).map(w => {
+        if (/^(mmlu|arc|gsm8k|piqa|race|boolq|multirc|record|wsc)$/i.test(w)) return w.toUpperCase();
+        return w.charAt(0).toUpperCase() + w.slice(1);
+      }).join(' ');
+    };
+
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true }); if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-evals-after-fix'))){
+        const cs = Array.from(document.querySelectorAll('.d3-evals-after-fix')).filter(el => !(el.dataset && el.dataset.mounted === 'true'));
+        container = cs[cs.length - 1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted === 'true') return; container.dataset.mounted = 'true'; }
+
+      // Controls (we will place them in a footer below the chart)
+      const controls = document.createElement('div');
+      controls.className = 'controls';
+      const controlGroup = document.createElement('div');
+      controlGroup.className = 'control-group';
+      const labelMetric = document.createElement('label');
+      labelMetric.textContent = 'Metric';
+      const selectMetric = document.createElement('select');
+      // Associate label and select with a unique id
+      const uniqueId = Math.random().toString(36).slice(2, 9);
+      selectMetric.id = `metric-select-${uniqueId}`;
+      labelMetric.setAttribute('for', selectMetric.id);
+      controlGroup.appendChild(labelMetric);
+      controlGroup.appendChild(selectMetric);
+      controls.appendChild(controlGroup);
+
+      // Tooltip
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none',
+          padding:'8px 10px', borderRadius:'8px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)',
+          background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 4px 24px rgba(0,0,0,.18)', opacity:'0', transition:'opacity .12s ease'
+        });
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // Header (legend + controls) placed after the chart
+      const header = document.createElement('div'); header.className = 'chart-header';
+      const legendBottom = document.createElement('div'); legendBottom.className = 'legend-bottom'; header.appendChild(legendBottom);
+      header.appendChild(controls);
+
+      // Chart card (SVG)
+      const card = document.createElement('div'); card.className = 'chart-card'; container.appendChild(card);
+      container.appendChild(header);
+      // SVG
+      const svg = d3.select(card).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+      const gGrid = gRoot.append('g').attr('class','grid');
+      const gAxes = gRoot.append('g').attr('class','axes');
+      const gAreas = gRoot.append('g').attr('class','areas');
+      const gLines = gRoot.append('g').attr('class','lines');
+      const gPoints = gRoot.append('g').attr('class','points');
+      // (legend removed from inside SVG)
+      const overlay = gRoot.append('rect').attr('fill','transparent').style('cursor','crosshair');
+      const hoverLine = gRoot.append('line').attr('stroke-width',1).style('display','none');
+
+      // State/data
+      let width = 800, height = 480; const margin = { top: 16, right: 32, bottom: 44, left: 56 };
+      const xScale = d3.scaleLinear();
+      const yScale = d3.scaleLinear();
+      const lineGen = d3.line().x(d => xScale(d.tokens)).y(d => yScale(d.value));
+      const dataByMetric = new Map();
+      let runOrder = [];
+
+      // Colors
+      function getRunColors(count){
+        try { if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') return window.ColorPalettes.getColors('categorical', count); } catch(_){}
+        return d3.schemeTableau10 ? d3.schemeTableau10.slice(0, count) : ['#4e79a7','#f28e2b','#e15759','#76b7b2','#59a14f','#edc948','#b07aa1','#ff9da7','#9c755f','#bab0ab'].slice(0, count);
+      }
+      
+      // Format helper for tokens (convert to billions)
+      function formatTokens(v){
+        const billions = v / 1e9;
+        return d3.format('.0f')(billions) + 'B';
+      }
+
+      function updateLayout(){
+        const axisColor = getComputedStyle(container).getPropertyValue('--axis-color').trim() || 'rgba(0,0,0,0.25)';
+        width = container.clientWidth || 800;
+        height = Math.max(280, Math.round(width / 3));
+        svg.attr('width', width).attr('height', height);
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        const innerWidth = width - margin.left - margin.right;
+        const innerHeight = height - margin.top - margin.bottom;
+        overlay.attr('x',0).attr('y',0).attr('width', innerWidth).attr('height', innerHeight);
+        hoverLine.attr('y1',0).attr('y2', innerHeight).attr('stroke', axisColor);
+        return { innerWidth, innerHeight };
+      }
+
+      function render(metricKey){
+        const { innerWidth, innerHeight } = updateLayout();
+        const map = dataByMetric.get(metricKey) || {};
+        const runs = runOrder;
+        // domains
+        let minTokens = Infinity, maxTokens = -Infinity, minV = Infinity, maxV = -Infinity;
+        runs.forEach(r => { (map[r]||[]).forEach(pt => { minTokens = Math.min(minTokens, pt.tokens); maxTokens = Math.max(maxTokens, pt.tokens); minV = Math.min(minV, pt.value); maxV = Math.max(maxV, pt.value); }); });
+        if (!isFinite(minTokens) || !isFinite(maxTokens)) return;
+        xScale.domain([minTokens, maxTokens]).range([0, innerWidth]);
+        yScale.domain([minV, maxV]).nice().range([innerHeight, 0]);
+
+        // grid
+        gGrid.selectAll('*').remove();
+        gGrid.selectAll('line').data(yScale.ticks(6)).join('line')
+          .attr('x1',0).attr('x2', innerWidth).attr('y1', d=>yScale(d)).attr('y2', d=>yScale(d))
+          .attr('stroke','var(--grid-color)').attr('stroke-width',1).attr('shape-rendering','crispEdges');
+
+        // axes
+        gAxes.selectAll('*').remove();
+        gAxes.append('g').attr('transform', `translate(0,${innerHeight})`).call(d3.axisBottom(xScale).ticks(8).tickFormat(formatTokens)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('g').call(d3.axisLeft(yScale).ticks(6)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('x', innerWidth/2).attr('y', innerHeight + 38).text('Tokens (B)');
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('transform', `translate(${-44}, ${innerHeight/2}) rotate(-90)`).text('Score');
+
+        // lines
+        const series = runs.map((r, i) => ({ run:r, color: getRunColors(runs.length)[i % getRunColors(runs.length).length], values: (map[r]||[]).slice().sort((a,b)=>a.tokens-b.tokens) }));
+        const paths = gLines.selectAll('path.run').data(series, d=>d.run);
+        const pathsEnter = paths.enter().append('path').attr('class','run').attr('fill','none').attr('stroke-width',2).attr('stroke', d=>d.color).attr('d', d=>lineGen(d.values));
+        pathsEnter.merge(paths).transition().duration(200).attr('stroke', d=>d.color).attr('d', d=>lineGen(d.values));
+        paths.exit().remove();
+
+        // Hover capture paths (wider invisible stroke for easy hover)
+        const captures = gLines.selectAll('path.run-hover').data(series, d=>`cap-${d.run}`);
+        captures.enter().append('path').attr('class','run-hover').attr('fill','none').attr('stroke','transparent').attr('stroke-width', 12).style('pointer-events','stroke')
+          .attr('d', d=>lineGen(d.values))
+          .merge(captures)
+          .attr('d', d=>lineGen(d.values))
+          .on('mouseenter', function(ev, d){
+            container.classList.add('hovering');
+            // ghost non hovered lines and points
+            gLines.selectAll('path.run').classed('ghost', s => s.run !== d.run);
+            gPoints.selectAll('circle.pt').classed('ghost', p => p.run !== d.run);
+            // ghost legend items
+            try {
+              const legendNode = legendBottom;
+              if (legendNode) {
+                legendNode.querySelectorAll('.item').forEach(el => {
+                  const name = el.getAttribute('data-run');
+                  el.classList.toggle('ghost', name !== d.run);
+                });
+              }
+            } catch {}
+          })
+          .on('mouseleave', function(){
+            container.classList.remove('hovering');
+            gLines.selectAll('path.run').classed('ghost', false);
+            gPoints.selectAll('circle.pt').classed('ghost', false);
+            try { const legendNode = legendBottom; if (legendNode) legendNode.querySelectorAll('.item').forEach(el => el.classList.remove('ghost')); } catch {}
+          });
+        captures.exit().remove();
+
+        // point markers (subtle)
+        const allPts = series.flatMap(s => s.values.map(v => ({ run:s.run, color:s.color, tokens:v.tokens, value:v.value })));
+        const ptsSel = gPoints.selectAll('circle.pt').data(allPts, d=>`${d.run}-${d.tokens}`);
+        ptsSel.enter().append('circle').attr('class','pt').attr('r', 2).attr('fill', d=>d.color).attr('fill-opacity', 0.6)
+          .attr('cx', d=>xScale(d.tokens)).attr('cy', d=>yScale(d.value))
+          .merge(ptsSel).transition().duration(150).attr('cx', d=>xScale(d.tokens)).attr('cy', d=>yScale(d.value));
+        ptsSel.exit().remove();
+
+        // legend (HTML below, left) with title above items
+        legendBottom.innerHTML = `<div class="legend-title">Legend</div><div class="items">${series.map(s => `<span class="item" data-run="${s.run}"><span class="swatch" style="background:${s.color}"></span><span>${s.run}</span></span>`).join('')}</div>`;
+        // Legend hover → ghost lines/points
+        try {
+          const legendNode = legendBottom;
+          legendNode.querySelectorAll('.item').forEach(el => {
+            el.addEventListener('mouseenter', () => {
+              const run = el.getAttribute('data-run'); if (!run) return;
+              container.classList.add('hovering');
+              gLines.selectAll('path.run').classed('ghost', s => s.run !== run);
+              gPoints.selectAll('circle.pt').classed('ghost', p => p.run !== run);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.toggle('ghost', it.getAttribute('data-run') !== run));
+            });
+            el.addEventListener('mouseleave', () => {
+              container.classList.remove('hovering');
+              gLines.selectAll('path.run').classed('ghost', false);
+              gPoints.selectAll('circle.pt').classed('ghost', false);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.remove('ghost'));
+            });
+          });
+        } catch {}
+
+        // hover
+        function onMove(ev){
+          const [mx, my] = d3.pointer(ev, overlay.node());
+          const sx = xScale.invert(mx);
+          // nearest token value
+          const tokens = Array.from(new Set(allPts.map(p=>p.tokens))).sort((a,b)=>a-b);
+          const nearest = tokens.reduce((best, s) => Math.abs(s - sx) < Math.abs(best - sx) ? s : best, tokens[0]);
+          const xpx = xScale(nearest);
+          hoverLine.style('display', null).attr('x1', xpx).attr('x2', xpx);
+          // tooltip content (styled)
+          let html = `<div style=\"font-weight:800;letter-spacing:.1px;\">${prettyMetricLabel(metricKey)}</div><div style=\"font-size:11px;color:var(--muted-color);margin-top:-4px;margin-bottom:2px;\">${formatTokens(nearest)} tokens</div>`;
+          const entries = series.map(s => {
+            const m = new Map(s.values.map(v=>[v.tokens, v.value]));
+            const val = m.get(nearest);
+            return { run: s.run, color: s.color, val };
+          }).filter(e => e.val != null);
+          entries.sort((a, b) => a.val - b.val);
+          entries.forEach(e => {
+            html += `<div style=\"display:flex;align-items:center;gap:6px;white-space:nowrap;\"><span class=\"d3-tooltip__color-dot\" style=\"background:${e.color}\"></span><strong>${e.run}</strong><span style=\"margin-left:auto;\">${(+e.val).toFixed(4)}</span></div>`;
+          });
+          tipInner.innerHTML = html; tip.style.opacity = '1'; tip.style.transform = `translate(${Math.round(mx + margin.left + 12)}px, ${Math.round(my + margin.top + 12)}px)`;
+        }
+        function onLeave(){ tip.style.opacity='0'; tip.style.transform='translate(-9999px, -9999px)'; hoverLine.style('display','none'); }
+        overlay.on('mousemove', onMove).on('mouseleave', onLeave);
+      }
+
+      // load CSV and init
+      (async () => {
+        try {
+          // Try multiple possible paths for the CSV file
+          const csvPaths = [
+            '/data/evals_tp_bug_fix_200B.csv',
+            './assets/data/evals_tp_bug_fix_200B.csv',
+            '../assets/data/evals_tp_bug_fix_200B.csv',
+            '../../assets/data/evals_tp_bug_fix_200B.csv'
+          ];
+          
+          let csvText = null;
+          for (const path of csvPaths) {
+            try {
+              const response = await fetch(path, { cache: 'no-cache' });
+              if (response.ok) {
+                csvText = await response.text();
+                break;
+              }
+            } catch(_) {}
+          }
+          
+          if (!csvText) {
+            throw new Error('CSV file not found: evals_tp_bug_fix_200B.csv');
+          }
+          const rows = d3.csvParse(csvText, d => ({
+            run: (d.run_name||'').trim(),
+            tokens: +d.tokens,
+            metric: (d.metric||'').trim(),
+            value: +d.value
+          }));
+          const metrics = Array.from(new Set(rows.map(r=>r.metric))).sort();
+          runOrder = Array.from(new Set(rows.map(r=>r.run))).sort();
+          metrics.forEach(m => {
+            const map = {}; runOrder.forEach(r => map[r] = []);
+            rows.filter(r=>r.metric===m).forEach(r => {
+              if (!isNaN(r.tokens) && !isNaN(r.value)) map[r.run].push({ tokens:r.tokens, value:r.value });
+            });
+            dataByMetric.set(m, map);
+          });
+          // populate metric select (pretty labels) or hide if single-file with single metric
+          const isSingleFile = true; // This is a single file
+          metrics.forEach(m => { const o = document.createElement('option'); o.value=m; o.textContent=prettyMetricLabel(m); selectMetric.appendChild(o); });
+          // default metric selection to hellaswag
+          if (metrics.length) {
+            let initial = metrics.find(m => m === 'hellaswag') || metrics[0];
+            selectMetric.value = initial;
+          }
+          if (isSingleFile && metrics.length <= 1) {
+            controls.style.display = 'none';
+          }
+
+          render(selectMetric.value);
+          selectMetric.addEventListener('change', () => render(selectMetric.value));
+          const rerender = () => render(selectMetric.value);
+          if (window.ResizeObserver) { const ro = new ResizeObserver(() => rerender()); ro.observe(container); } else { window.addEventListener('resize', rerender); }
+        } catch (e) {
+          const pre = document.createElement('pre'); pre.textContent = 'CSV load error: ' + (e && e.message ? e.message : e);
+          pre.style.color = 'var(--danger, #b00020)'; pre.style.fontSize = '12px'; pre.style.whiteSpace = 'pre-wrap'; container.appendChild(pre);
+        }
+      })();
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
diff --git a/app/src/content/embeds/d3-evals-tpbug.html b/app/src/content/embeds/d3-evals-tpbug.html
new file mode 100644
index 0000000000000000000000000000000000000000..1b1f4956d76550e1fdae500c18e8d2ae167abdf0
--- /dev/null
+++ b/app/src/content/embeds/d3-evals-tpbug.html
@@ -0,0 +1,400 @@
+<div class="d3-evals-tpbug"></div>
+<style>
+  .d3-evals-tpbug { position: relative; }
+  .d3-evals-tpbug .controls {
+    margin-top: 0;
+    display: flex;
+    gap: 16px;
+    align-items: center;
+    justify-content: flex-end;
+    width: auto;
+    flex-wrap: wrap;
+  }
+  .d3-evals-tpbug .controls label {
+    font-size: 12px;
+    color: var(--text-color);
+    display: flex;
+    align-items: center;
+    gap: 6px;
+    white-space: nowrap;
+    font-weight: 700;
+  }
+  .d3-evals-tpbug .controls select {
+    font-size: 12px;
+    padding: 8px 28px 8px 10px;
+    border: 1px solid var(--border-color);
+    border-radius: 8px;
+    background-color: var(--surface-bg);
+    color: var(--text-color);
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%230f1115' stroke-width='2' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+    background-repeat: no-repeat; background-position: right 8px center; background-size: 12px;
+    -webkit-appearance: none; appearance: none; cursor: pointer; transition: border-color .15s ease, box-shadow .15s ease;
+  }
+  [data-theme="dark"] .d3-evals-tpbug .controls select {
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%23ffffff' stroke-width='2' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+  }
+  .d3-evals-tpbug .controls select:hover { border-color: var(--primary-color); }
+  .d3-evals-tpbug .controls select:focus { border-color: var(--primary-color); box-shadow: 0 0 0 3px rgba(232,137,171,.25); outline: none; }
+  .d3-evals-tpbug .axis-label { fill: var(--text-color); font-size: 12px; font-weight: 700; }
+  .d3-evals-tpbug .axes path, .d3-evals-tpbug .axes line { stroke: var(--axis-color); }
+  .d3-evals-tpbug .axes text { fill: var(--tick-color); }
+  .d3-evals-tpbug .grid line { stroke: var(--grid-color); }
+  .d3-evals-tpbug .legend { font-size: 12px; color: var(--text-color);padding-left: 6px; }
+  .d3-evals-tpbug .legend .items { display:flex; flex-wrap:wrap; gap:8px 12px; align-items:center; }
+  .d3-evals-tpbug .legend .item { display:flex; align-items:center; gap:6px; white-space:nowrap; }
+  .d3-evals-tpbug .legend .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; }
+  /* Ghosting on hover */
+  .d3-evals-tpbug.hovering .legend-bottom .item.ghost { opacity: .35; }
+  .d3-evals-tpbug.hovering .lines path.ghost { opacity: .25; }
+  .d3-evals-tpbug.hovering .points circle.ghost { opacity: .25; }
+  .d3-evals-tpbug.hovering .areas path.ghost { opacity: .08; }
+  .d3-evals-tpbug .chart-header { display:flex; align-items:center; justify-content:space-between; gap:12px; margin: 0 0 8px 0; flex-wrap: wrap; }
+  .d3-evals-tpbug .legend-bottom { display:flex; align-items:center; justify-content:flex-start; font-size:12px; color: var(--text-color); }
+  .d3-evals-tpbug .legend-bottom .items { display:flex; flex-wrap:wrap; gap:8px 14px; }
+  .d3-evals-tpbug .legend-bottom .item { display:inline-flex; align-items:center; gap:6px; white-space:nowrap; }
+  .d3-evals-tpbug .legend-bottom .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; }
+  .d3-evals-tpbug .lines path.active { stroke-width: 3; }
+  /* Layout tweaks: stack label above select, add legend title above items */
+  .d3-evals-tpbug .controls .control-group {
+    display: flex;
+    flex-direction: column;
+    align-items: flex-start;
+    gap: 6px;
+  }
+  .d3-evals-tpbug .legend-bottom {
+    flex-direction: column;
+    align-items: flex-start;
+    gap: 6px;
+  }
+  .d3-evals-tpbug .legend-bottom .legend-title {
+    font-size: 12px;
+    font-weight: 700;
+    color: var(--text-color);
+  }
+  /* Tooltip styling aligned with filters-quad */
+  .d3-evals-tpbug .d3-tooltip { z-index: var(--z-elevated); backdrop-filter: saturate(1.12) blur(8px); }
+  .d3-evals-tpbug .d3-tooltip__inner { display:flex; flex-direction:column; gap:6px; min-width: 220px; }
+  .d3-evals-tpbug .d3-tooltip__inner > div:first-child { font-weight: 800; letter-spacing: 0.1px; margin-bottom: 0; }
+  .d3-evals-tpbug .d3-tooltip__inner > div:nth-child(2) { font-size: 11px; color: var(--muted-color); display: block; margin-top: -4px; margin-bottom: 2px; letter-spacing: 0.1px; }
+  .d3-evals-tpbug .d3-tooltip__inner > div:nth-child(n+3) { padding-top: 6px; border-top: 1px solid var(--border-color); }
+  .d3-evals-tpbug .d3-tooltip__color-dot { display:inline-block; width: 12px; height: 12px; border-radius: 3px; border: 1px solid var(--border-color); }
+  /* Chart card only around the SVG */
+  .d3-evals-tpbug .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+  /* Place header below chart and align start */
+  .d3-evals-tpbug .chart-header { display:flex; align-items:flex-start; justify-content:flex-start; gap:12px; margin: 8px 0 0 0; flex-wrap: wrap; }
+</style>
+<script>
+  (() => {
+    // Pretty label mapping for metric keys
+    const prettyMetricLabel = (key) => {
+      if (!key) return '';
+      const table = {
+        'hellaswag': 'HellaSwag',
+        'mmlu': 'MMLU',
+        'arc': 'ARC',
+        'truthfulqa': 'TruthfulQA',
+        'gsm8k': 'GSM8K',
+        'winogrande': 'WinoGrande',
+        'openbookqa': 'OpenBookQA',
+        'piqa': 'PIQA',
+        'race': 'RACE',
+        'boolq': 'BoolQ',
+        'cb': 'CB',
+        'copa': 'COPA',
+        'multirc': 'MultiRC',
+        'record': 'ReCoRD',
+        'rte': 'RTE',
+        'wic': 'WiC',
+        'wsc': 'WSC'
+      };
+      if (table[key]) return table[key];
+      const cleaned = String(key).replace(/[_-]+/g, ' ').trim();
+      return cleaned.split(/\s+/).map(w => {
+        if (/^(mmlu|arc|gsm8k|piqa|race|boolq|multirc|record|wsc)$/i.test(w)) return w.toUpperCase();
+        return w.charAt(0).toUpperCase() + w.slice(1);
+      }).join(' ');
+    };
+
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true }); if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-evals-tpbug'))){
+        const cs = Array.from(document.querySelectorAll('.d3-evals-tpbug')).filter(el => !(el.dataset && el.dataset.mounted === 'true'));
+        container = cs[cs.length - 1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted === 'true') return; container.dataset.mounted = 'true'; }
+
+      // Controls (we will place them in a footer below the chart)
+      const controls = document.createElement('div');
+      controls.className = 'controls';
+      const controlGroup = document.createElement('div');
+      controlGroup.className = 'control-group';
+      const labelMetric = document.createElement('label');
+      labelMetric.textContent = 'Metric';
+      const selectMetric = document.createElement('select');
+      // Associate label and select with a unique id
+      const uniqueId = Math.random().toString(36).slice(2, 9);
+      selectMetric.id = `metric-select-${uniqueId}`;
+      labelMetric.setAttribute('for', selectMetric.id);
+      controlGroup.appendChild(labelMetric);
+      controlGroup.appendChild(selectMetric);
+      controls.appendChild(controlGroup);
+
+      // Tooltip
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none',
+          padding:'8px 10px', borderRadius:'8px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)',
+          background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 4px 24px rgba(0,0,0,.18)', opacity:'0', transition:'opacity .12s ease'
+        });
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // Header (legend + controls) placed after the chart
+      const header = document.createElement('div'); header.className = 'chart-header';
+      const legendBottom = document.createElement('div'); legendBottom.className = 'legend-bottom'; header.appendChild(legendBottom);
+      header.appendChild(controls);
+
+      // Chart card (SVG)
+      const card = document.createElement('div'); card.className = 'chart-card'; container.appendChild(card);
+      container.appendChild(header);
+      // SVG
+      const svg = d3.select(card).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+      const gGrid = gRoot.append('g').attr('class','grid');
+      const gAxes = gRoot.append('g').attr('class','axes');
+      const gAreas = gRoot.append('g').attr('class','areas');
+      const gLines = gRoot.append('g').attr('class','lines');
+      const gPoints = gRoot.append('g').attr('class','points');
+      // (legend removed from inside SVG)
+      const overlay = gRoot.append('rect').attr('fill','transparent').style('cursor','crosshair');
+      const hoverLine = gRoot.append('line').attr('stroke-width',1).style('display','none');
+
+      // State/data
+      let width = 800, height = 480; const margin = { top: 16, right: 32, bottom: 44, left: 56 };
+      const xScale = d3.scaleLinear();
+      const yScale = d3.scaleLinear();
+      const lineGen = d3.line().x(d => xScale(d.tokens)).y(d => yScale(d.value));
+      const dataByMetric = new Map();
+      let runOrder = [];
+
+      // Colors
+      function getRunColors(count){
+        try { if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') return window.ColorPalettes.getColors('categorical', count); } catch(_){}
+        return d3.schemeTableau10 ? d3.schemeTableau10.slice(0, count) : ['#4e79a7','#f28e2b','#e15759','#76b7b2','#59a14f','#edc948','#b07aa1','#ff9da7','#9c755f','#bab0ab'].slice(0, count);
+      }
+      
+      // Format helper for tokens (convert to billions)
+      function formatTokens(v){
+        const billions = v / 1e9;
+        return d3.format('.0f')(billions) + 'B';
+      }
+
+      function updateLayout(){
+        const axisColor = getComputedStyle(container).getPropertyValue('--axis-color').trim() || 'rgba(0,0,0,0.25)';
+        width = container.clientWidth || 800;
+        height = Math.max(280, Math.round(width / 3));
+        svg.attr('width', width).attr('height', height);
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        const innerWidth = width - margin.left - margin.right;
+        const innerHeight = height - margin.top - margin.bottom;
+        overlay.attr('x',0).attr('y',0).attr('width', innerWidth).attr('height', innerHeight);
+        hoverLine.attr('y1',0).attr('y2', innerHeight).attr('stroke', axisColor);
+        return { innerWidth, innerHeight };
+      }
+
+      function render(metricKey){
+        const { innerWidth, innerHeight } = updateLayout();
+        const map = dataByMetric.get(metricKey) || {};
+        const runs = runOrder;
+        // domains
+        let minTokens = Infinity, maxTokens = -Infinity, minV = Infinity, maxV = -Infinity;
+        runs.forEach(r => { (map[r]||[]).forEach(pt => { minTokens = Math.min(minTokens, pt.tokens); maxTokens = Math.max(maxTokens, pt.tokens); minV = Math.min(minV, pt.value); maxV = Math.max(maxV, pt.value); }); });
+        if (!isFinite(minTokens) || !isFinite(maxTokens)) return;
+        xScale.domain([minTokens, maxTokens]).range([0, innerWidth]);
+        yScale.domain([minV, maxV]).nice().range([innerHeight, 0]);
+
+        // grid
+        gGrid.selectAll('*').remove();
+        gGrid.selectAll('line').data(yScale.ticks(6)).join('line')
+          .attr('x1',0).attr('x2', innerWidth).attr('y1', d=>yScale(d)).attr('y2', d=>yScale(d))
+          .attr('stroke','var(--grid-color)').attr('stroke-width',1).attr('shape-rendering','crispEdges');
+
+        // axes
+        gAxes.selectAll('*').remove();
+        gAxes.append('g').attr('transform', `translate(0,${innerHeight})`).call(d3.axisBottom(xScale).ticks(8).tickFormat(formatTokens)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('g').call(d3.axisLeft(yScale).ticks(6)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('x', innerWidth/2).attr('y', innerHeight + 38).text('Tokens (B)');
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('transform', `translate(${-44}, ${innerHeight/2}) rotate(-90)`).text('Score');
+
+        // lines
+        const series = runs.map((r, i) => ({ run:r, color: getRunColors(runs.length)[i % getRunColors(runs.length).length], values: (map[r]||[]).slice().sort((a,b)=>a.tokens-b.tokens) }));
+        const paths = gLines.selectAll('path.run').data(series, d=>d.run);
+        const pathsEnter = paths.enter().append('path').attr('class','run').attr('fill','none').attr('stroke-width',2).attr('stroke', d=>d.color).attr('d', d=>lineGen(d.values));
+        pathsEnter.merge(paths).transition().duration(200).attr('stroke', d=>d.color).attr('d', d=>lineGen(d.values));
+        paths.exit().remove();
+
+        // Hover capture paths (wider invisible stroke for easy hover)
+        const captures = gLines.selectAll('path.run-hover').data(series, d=>`cap-${d.run}`);
+        captures.enter().append('path').attr('class','run-hover').attr('fill','none').attr('stroke','transparent').attr('stroke-width', 12).style('pointer-events','stroke')
+          .attr('d', d=>lineGen(d.values))
+          .merge(captures)
+          .attr('d', d=>lineGen(d.values))
+          .on('mouseenter', function(ev, d){
+            container.classList.add('hovering');
+            // ghost non hovered lines and points
+            gLines.selectAll('path.run').classed('ghost', s => s.run !== d.run);
+            gPoints.selectAll('circle.pt').classed('ghost', p => p.run !== d.run);
+            // ghost legend items
+            try {
+              const legendNode = legendBottom;
+              if (legendNode) {
+                legendNode.querySelectorAll('.item').forEach(el => {
+                  const name = el.getAttribute('data-run');
+                  el.classList.toggle('ghost', name !== d.run);
+                });
+              }
+            } catch {}
+          })
+          .on('mouseleave', function(){
+            container.classList.remove('hovering');
+            gLines.selectAll('path.run').classed('ghost', false);
+            gPoints.selectAll('circle.pt').classed('ghost', false);
+            try { const legendNode = legendBottom; if (legendNode) legendNode.querySelectorAll('.item').forEach(el => el.classList.remove('ghost')); } catch {}
+          });
+        captures.exit().remove();
+
+        // point markers (subtle)
+        const allPts = series.flatMap(s => s.values.map(v => ({ run:s.run, color:s.color, tokens:v.tokens, value:v.value })));
+        const ptsSel = gPoints.selectAll('circle.pt').data(allPts, d=>`${d.run}-${d.tokens}`);
+        ptsSel.enter().append('circle').attr('class','pt').attr('r', 2).attr('fill', d=>d.color).attr('fill-opacity', 0.6)
+          .attr('cx', d=>xScale(d.tokens)).attr('cy', d=>yScale(d.value))
+          .merge(ptsSel).transition().duration(150).attr('cx', d=>xScale(d.tokens)).attr('cy', d=>yScale(d.value));
+        ptsSel.exit().remove();
+
+        // legend (HTML below, left) with title above items
+        legendBottom.innerHTML = `<div class="legend-title">Legend</div><div class="items">${series.map(s => `<span class="item" data-run="${s.run}"><span class="swatch" style="background:${s.color}"></span><span>${s.run}</span></span>`).join('')}</div>`;
+        // Legend hover → ghost lines/points
+        try {
+          const legendNode = legendBottom;
+          legendNode.querySelectorAll('.item').forEach(el => {
+            el.addEventListener('mouseenter', () => {
+              const run = el.getAttribute('data-run'); if (!run) return;
+              container.classList.add('hovering');
+              gLines.selectAll('path.run').classed('ghost', s => s.run !== run);
+              gPoints.selectAll('circle.pt').classed('ghost', p => p.run !== run);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.toggle('ghost', it.getAttribute('data-run') !== run));
+            });
+            el.addEventListener('mouseleave', () => {
+              container.classList.remove('hovering');
+              gLines.selectAll('path.run').classed('ghost', false);
+              gPoints.selectAll('circle.pt').classed('ghost', false);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.remove('ghost'));
+            });
+          });
+        } catch {}
+
+        // hover
+        function onMove(ev){
+          const [mx, my] = d3.pointer(ev, overlay.node());
+          const sx = xScale.invert(mx);
+          // nearest token value
+          const tokens = Array.from(new Set(allPts.map(p=>p.tokens))).sort((a,b)=>a-b);
+          const nearest = tokens.reduce((best, s) => Math.abs(s - sx) < Math.abs(best - sx) ? s : best, tokens[0]);
+          const xpx = xScale(nearest);
+          hoverLine.style('display', null).attr('x1', xpx).attr('x2', xpx);
+          // tooltip content (styled)
+          let html = `<div style=\"font-weight:800;letter-spacing:.1px;\">${prettyMetricLabel(metricKey)}</div><div style=\"font-size:11px;color:var(--muted-color);margin-top:-4px;margin-bottom:2px;\">${formatTokens(nearest)} tokens</div>`;
+          const entries = series.map(s => {
+            const m = new Map(s.values.map(v=>[v.tokens, v.value]));
+            const val = m.get(nearest);
+            return { run: s.run, color: s.color, val };
+          }).filter(e => e.val != null);
+          entries.sort((a, b) => a.val - b.val);
+          entries.forEach(e => {
+            html += `<div style=\"display:flex;align-items:center;gap:6px;white-space:nowrap;\"><span class=\"d3-tooltip__color-dot\" style=\"background:${e.color}\"></span><strong>${e.run}</strong><span style=\"margin-left:auto;\">${(+e.val).toFixed(4)}</span></div>`;
+          });
+          tipInner.innerHTML = html; tip.style.opacity = '1'; tip.style.transform = `translate(${Math.round(mx + margin.left + 12)}px, ${Math.round(my + margin.top + 12)}px)`;
+        }
+        function onLeave(){ tip.style.opacity='0'; tip.style.transform='translate(-9999px, -9999px)'; hoverLine.style('display','none'); }
+        overlay.on('mousemove', onMove).on('mouseleave', onLeave);
+      }
+
+      // load CSV and init
+      (async () => {
+        try {
+          // Try multiple possible paths for the CSV file
+          const csvPaths = [
+            '/data/evals_no_fixed_200B.csv',
+            './assets/data/evals_no_fixed_200B.csv',
+            '../assets/data/evals_no_fixed_200B.csv',
+            '../../assets/data/evals_no_fixed_200B.csv'
+          ];
+          
+          let csvText = null;
+          for (const path of csvPaths) {
+            try {
+              const response = await fetch(path, { cache: 'no-cache' });
+              if (response.ok) {
+                csvText = await response.text();
+                break;
+              }
+            } catch(_) {}
+          }
+          
+          if (!csvText) {
+            throw new Error('CSV file not found: evals_no_fixed_200B.csv');
+          }
+          const rows = d3.csvParse(csvText, d => ({
+            run: (d.run_name||'').trim(),
+            tokens: +d.tokens,
+            metric: (d.metric||'').trim(),
+            value: +d.value
+          }));
+          const metrics = Array.from(new Set(rows.map(r=>r.metric))).sort();
+          runOrder = Array.from(new Set(rows.map(r=>r.run))).sort();
+          metrics.forEach(m => {
+            const map = {}; runOrder.forEach(r => map[r] = []);
+            rows.filter(r=>r.metric===m).forEach(r => {
+              if (!isNaN(r.tokens) && !isNaN(r.value)) map[r.run].push({ tokens:r.tokens, value:r.value });
+            });
+            dataByMetric.set(m, map);
+          });
+          // populate metric select (pretty labels) or hide if single-file with single metric
+          const isSingleFile = true; // This is a single file
+          metrics.forEach(m => { const o = document.createElement('option'); o.value=m; o.textContent=prettyMetricLabel(m); selectMetric.appendChild(o); });
+          // default metric selection to hellaswag
+          if (metrics.length) {
+            let initial = metrics.find(m => m === 'hellaswag') || metrics[0];
+            selectMetric.value = initial;
+          }
+          if (isSingleFile && metrics.length <= 1) {
+            controls.style.display = 'none';
+          }
+
+          render(selectMetric.value);
+          selectMetric.addEventListener('change', () => render(selectMetric.value));
+          const rerender = () => render(selectMetric.value);
+          if (window.ResizeObserver) { const ro = new ResizeObserver(() => rerender()); ro.observe(container); } else { window.addEventListener('resize', rerender); }
+        } catch (e) {
+          const pre = document.createElement('pre'); pre.textContent = 'CSV load error: ' + (e && e.message ? e.message : e);
+          pre.style.color = 'var(--danger, #b00020)'; pre.style.fontSize = '12px'; pre.style.whiteSpace = 'pre-wrap'; container.appendChild(pre);
+        }
+      })();
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
diff --git a/app/src/content/embeds/d3-line-quad.html b/app/src/content/embeds/d3-line-quad.html
new file mode 100644
index 0000000000000000000000000000000000000000..7e1c77eb7923636d60c7263c83a0a703d14ac733
--- /dev/null
+++ b/app/src/content/embeds/d3-line-quad.html
@@ -0,0 +1,645 @@
+<div class="line-quad">
+  
+  <div class="line-quad__grid">
+    <div class="quad-cell" data-title="Formatting Filter" data-csv="/data/formatting_filters.csv"></div>
+    <div class="quad-cell" data-title="Relevance Filter" data-csv="/data/relevance_filters.csv"></div>
+    <div class="quad-cell" data-title="Visual Dependency Filter" data-csv="/data/visual_dependency_filters.csv"></div>
+    <div class="quad-cell" data-title="Image Correspondence Filter" data-csv="/data/image_correspondence_filters.csv"></div>
+  </div>
+  <noscript>JavaScript is required to render these charts.</noscript>
+
+</div>
+<style>
+  .line-quad { position: relative; }
+  /* Axis/tick/grid use global variables from _variables.css */
+  /* Apply axis/tick/grid purely via CSS */
+  .line-quad .axes path,
+  .line-quad .axes line { stroke: var(--axis-color); }
+  .line-quad .axes text { fill: var(--tick-color); }
+  .line-quad .grid line { stroke: var(--grid-color); }
+  .line-quad__grid { display:grid; grid-template-columns: repeat(2, minmax(0, 1fr)); gap: 12px; }
+  @media (max-width: 980px) { .line-quad__grid { grid-template-columns: 1fr; } }
+
+  
+
+  .quad-cell { border:1px solid var(--border-color); border-radius:10px; background: var(--surface-bg); display:flex; flex-direction:column; position: relative; }
+  /* Stacking order to ensure hover/tooltip overlays are not hidden by neighbors */
+  .line-quad__grid .quad-cell:nth-child(1) { z-index: 4; } /* top-left */
+  .line-quad__grid .quad-cell:nth-child(3) { z-index: 3; } /* bottom-left */
+  .line-quad__grid .quad-cell:nth-child(2) { z-index: 2; } /* top-right */
+  .line-quad__grid .quad-cell:nth-child(4) { z-index: 1; } /* bottom-right */
+  .quad-cell .cell-header { padding:8px 10px; border-bottom:1px solid var(--border-color); display:flex; align-items:center; justify-content:space-between; gap:8px; }
+  .quad-cell .cell-title { font-size: 13px; font-weight: 700; color: var(--text-color); }
+  .quad-cell .cell-controls { display:flex; align-items:center; gap:12px; }
+  .quad-cell .cell-controls label { font-size:12px; color: var(--muted-color); display:flex; align-items:center; gap:6px; white-space:nowrap; }
+  .quad-cell select {
+    font-size: 12px; padding: 6px 28px 6px 10px; border: 1px solid var(--border-color); border-radius: 8px;
+    background-color: var(--surface-bg); color: var(--text-color);
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%230f1115' stroke-width='1' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+    background-repeat: no-repeat; background-position: right 8px center; background-size: 12px;
+    -webkit-appearance: none; appearance: none; cursor: pointer; transition: border-color .15s ease, box-shadow .15s ease;
+  }
+  [data-theme="dark"] .quad-cell select {
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%23ffffff' stroke-width='1' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+  }
+  .quad-cell select:hover { border-color: var(--primary-color); }
+  .quad-cell select:focus { border-color: var(--primary-color); box-shadow: 0 0 0 3px rgba(232,137,171,.25); outline: none; }
+  .quad-cell .cell-body { position: relative; }
+  .quad-cell .cell-body { width:100%; overflow:hidden; }
+  .quad-cell .cell-body svg { max-width:100%; height:auto; }
+  
+  .line-quad.hovering .lines path.ghost { opacity: .25; }
+  .line-quad.hovering .points circle.ghost { opacity: .25; }
+  .line-quad.hovering .areas path.ghost { opacity: .08; }
+  .line-quad.hovering .legend-bottom .item.ghost { opacity: .35; }
+  /* Tooltip refined styling */
+  .line-quad .d3-tooltip {
+    z-index: 20;
+    backdrop-filter: saturate(1.12) blur(8px);
+  }
+  .line-quad .d3-tooltip__inner {
+    display: flex;
+    flex-direction: column;
+    gap: 6px;
+    min-width: 220px;
+  }
+  .line-quad .d3-tooltip__inner > div:first-child {
+    font-weight: 800;
+    letter-spacing: 0.1px;
+    margin-bottom: 0;
+  }
+  .line-quad .d3-tooltip__inner > div:nth-child(2) {
+    font-size: 11px;
+    color: var(--muted-color);
+    display: block;
+    margin-top: -4px;
+    margin-bottom: 2px;
+    letter-spacing: 0.1px;
+  }
+  .line-quad .d3-tooltip__inner > div:nth-child(n+3) {
+    padding-top: 6px;
+    border-top: 1px solid var(--border-color);
+  }
+  .line-quad .d3-tooltip__inner svg {
+    display: inline-block;
+    vertical-align: middle;
+    margin-right: 2px;
+  }
+  .line-quad .d3-tooltip__inner strong {
+    margin-right: 6px;
+  }
+  .line-quad .d3-tooltip__color-dot {
+    display: inline-block;
+    width: 12px;
+    height: 12px;
+    border-radius: 3px;
+    border: 1px solid var(--border-color);
+  }
+  /* Header layout (like d3-line-simple) */
+  .line-quad__header {
+    display: flex;
+    align-items: flex-start;
+    justify-content: flex-start;
+    gap: 12px;
+    margin: 8px 0 0 0;
+    flex-wrap: wrap;
+  }
+  .line-quad__header .legend-bottom {
+    display: flex;
+    flex-direction: column;
+    align-items: flex-start;
+    gap: 6px;
+    font-size: 12px;
+    color: var(--text-color);
+  }
+  .line-quad__header .legend-bottom .legend-title {
+    font-size: 12px;
+    font-weight: 700;
+    color: var(--text-color);
+  }
+  .line-quad__header .legend-bottom .items {
+    display: flex;
+    flex-wrap: wrap;
+    gap: 8px 14px;
+  }
+  .line-quad__header .legend-bottom .item {
+    display: inline-flex;
+    align-items: center;
+    gap: 6px;
+    white-space: nowrap;
+  }
+  .line-quad__header .legend-bottom .swatch {
+    width: 14px;
+    height: 14px;
+    border-radius: 3px;
+    border: 1px solid var(--border-color);
+    display: inline-block;
+  }
+  .line-quad .controls {
+    margin-top: 0;
+    display: flex;
+    gap: 16px;
+    align-items: center;
+    justify-content: flex-end;
+    width: auto;
+    flex-wrap: wrap;
+  }
+  .line-quad .controls .control-group {
+    display: flex;
+    flex-direction: column;
+    align-items: flex-start;
+    gap: 6px;
+  }
+  .line-quad .controls label {
+    font-size: 12px;
+    color: var(--text-color);
+    display: flex;
+    align-items: center;
+    gap: 6px;
+    white-space: nowrap;
+    font-weight: 700;
+  }
+  .line-quad .controls select {
+    font-size: 12px;
+    padding: 8px 28px 8px 10px;
+    border: 1px solid var(--border-color);
+    border-radius: 8px;
+    background-color: var(--surface-bg);
+    color: var(--text-color);
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%230f1115' stroke-width='1' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+    background-repeat: no-repeat;
+    background-position: right 8px center;
+    background-size: 12px;
+    -webkit-appearance: none;
+    appearance: none;
+    cursor: pointer;
+    transition: border-color .15s ease, box-shadow .15s ease;
+  }
+  [data-theme="dark"] .line-quad .controls select {
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%23ffffff' stroke-width='1' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+  }
+  .line-quad .controls select:hover { border-color: var(--primary-color); }
+  .line-quad .controls select:focus { border-color: var(--primary-color); box-shadow: 0 0 0 3px rgba(232,137,171,.25); outline: none; }
+</style>
+<script>
+  (() => {
+    const THIS_SCRIPT = document.currentScript;
+    // Shared run->color mapping to keep legend and series perfectly in sync
+    let SHARED_RUN_COLOR = null;
+    // Pretty label mapping for metric keys
+    const prettyMetricLabel = (key) => {
+      if (!key) return '';
+      const table = {
+        'ai2d_exact_match': 'AI2D Exact Match',
+        'average_rank': 'Average Rank',
+      };
+      if (table[key]) return table[key];
+      const cleaned = String(key).replace(/[_-]+/g, ' ').trim();
+      return cleaned.split(/\s+/).map(w => {
+        if (/^(ai2d|umap|id|auc|f1)$/i.test(w)) return w.toUpperCase();
+        return w.charAt(0).toUpperCase() + w.slice(1);
+      }).join(' ');
+    };
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true }); if (window.d3) onReady();
+    };
+
+    function initRunLine(cell){
+      const d3 = window.d3;
+      const csvPath = cell.getAttribute('data-csv');
+      const titleText = cell.getAttribute('data-title') || '';
+
+      // Header
+      const header = document.createElement('div'); header.className = 'cell-header';
+      const title = document.createElement('div'); title.className = 'cell-title'; title.textContent = titleText; header.appendChild(title);
+      // Per-cell controls supprimés (contrôle global utilisé)
+      cell.appendChild(header);
+
+      // Body & SVG
+      const body = document.createElement('div'); body.className = 'cell-body'; cell.appendChild(body);
+      const svg = d3.select(body).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+      const gGrid = gRoot.append('g').attr('class','grid');
+      const gAxes = gRoot.append('g').attr('class','axes');
+      const gAreas = gRoot.append('g').attr('class','areas');
+      const gLines = gRoot.append('g').attr('class','lines');
+      const gPoints = gRoot.append('g').attr('class','points');
+      const gHover = gRoot.append('g').attr('class','hover');
+      // Removed per-cell legend; using global footer legend
+
+      // Tooltip
+      cell.style.position = cell.style.position || 'relative';
+      let tip = cell.querySelector('.d3-tooltip'); let tipInner; let hideTipTimer = null;
+      if (!tip) {
+        tip = document.createElement('div');
+        tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position:'absolute',
+          top:'0',
+          left:'0',
+          transform:'translate(-9999px,-9999px)',
+          pointerEvents:'none',
+          padding:'10px 12px',
+          borderRadius:'12px',
+          fontSize:'12px',
+          lineHeight:'1.35',
+          border:'1px solid var(--border-color)',
+          background:'var(--surface-bg)',
+          color:'var(--text-color)',
+          boxShadow:'0 8px 32px rgba(0,0,0,.28), 0 2px 8px rgba(0,0,0,.12)',
+          opacity:'0',
+          transition:'opacity .12s ease',
+          backdropFilter:'saturate(1.12) blur(8px)'
+        });
+        tipInner = document.createElement('div');
+        tipInner.className = 'd3-tooltip__inner';
+        tipInner.style.textAlign='left';
+        tip.appendChild(tipInner);
+        cell.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // State
+      let metricList = []; let runList = []; let runOrder = []; const dataByMetric = new Map();
+      let width = 800, height = 340; const margin = { top: 16, right: 20, bottom: 46, left: 56 };
+      const xScale = d3.scaleLinear(); const yScale = d3.scaleLinear();
+      const lineGen = d3.line().x(d => xScale(d.step)).y(d => yScale(d.value));
+      let isRankStrictFlag = false; let isRankMetricFlag = false; let rankTickMax = 1;
+      let sharedYConfig = null; // { type: 'rank_strict', maxRank } | { type: 'value', min, max }
+      let axisLabelY = 'Value';
+      
+      // Colors and markers (match original embeds)
+      const getRunColors = (n) => {
+        try { if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') return window.ColorPalettes.getColors('categorical', n); } catch(_) {}
+        const primary = getComputedStyle(document.documentElement).getPropertyValue('--primary-color').trim() || '#E889AB';
+        return [primary, '#4EA5B7', '#E38A42', '#CEC0FA', ...(d3.schemeTableau10||[])].slice(0, n);
+      };
+      const pool = getRunColors(12);
+      // Shapes supprimés: on n'utilise que la couleur
+      // Ready signal for async load completion
+      let readyResolve = null;
+      const ready = new Promise((res)=> { readyResolve = res; });
+
+      // Shared formatter for thousands: 5000 -> 5k, 1500 -> 1.5k (trim .0)
+      const formatK = (v) => {
+        const abs = Math.abs(v);
+        if (abs >= 1000) {
+          const n = v / 1000;
+          const s = d3.format('.1f')(n);
+          return (s.endsWith('.0') ? s.slice(0, -2) : s) + 'k';
+        }
+        return d3.format('d')(v);
+      };
+
+      function updateScales(){
+        const isDark = document.documentElement.getAttribute('data-theme') === 'dark';
+        const axisColor = 'var(--axis-color)';
+        const tickColor = 'var(--tick-color)';
+        const gridColor = 'var(--grid-color)';
+
+        const rect = cell.getBoundingClientRect();
+        width = Math.max(1, Math.round(rect && rect.width ? rect.width : (cell.clientWidth || 800)));
+        height = Math.max(280, Math.round(width / 2.3));
+        svg.attr('width', width).attr('height', height).attr('viewBox', `0 0 ${width} ${height}`).attr('preserveAspectRatio','xMidYMid meet');
+        const innerWidth = width - margin.left - margin.right; const innerHeight = height - margin.top - margin.bottom;
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        xScale.range([0, innerWidth]); yScale.range([innerHeight, 0]);
+
+        // Y ticks
+        let yTicks = [];
+        if (isRankStrictFlag) { const maxR = Math.max(1, Math.round(rankTickMax)); for (let v=1; v<=maxR; v+=1) yTicks.push(v); }
+        else { yTicks = yScale.ticks(6); }
+
+        // Grid
+        gGrid.selectAll('*').remove();
+        gGrid.selectAll('line').data(yTicks).join('line')
+          .attr('x1',0).attr('x2',innerWidth).attr('y1',d=>yScale(d)).attr('y2',d=>yScale(d))
+          .attr('stroke', gridColor).attr('stroke-width',1).attr('shape-rendering','crispEdges');
+
+        // Axes
+        gAxes.selectAll('*').remove();
+        let xAxis = d3.axisBottom(xScale).tickSizeOuter(0); xAxis = xAxis.ticks(8);
+        xAxis = xAxis.tickFormat(formatK);
+        const yAxis = d3.axisLeft(yScale).tickValues(yTicks).tickSizeOuter(0).tickFormat(isRankStrictFlag ? d3.format('d') : d3.format('.2f'));
+        gAxes.append('g').attr('transform', `translate(0,${innerHeight})`).call(xAxis).call(g=>{ g.selectAll('path, line').attr('stroke', axisColor); g.selectAll('text').attr('fill', tickColor).style('font-size','11px'); });
+        gAxes.append('g').call(yAxis).call(g=>{ g.selectAll('path, line').attr('stroke', axisColor); g.selectAll('text').attr('fill', tickColor).style('font-size','11px'); });
+
+        // Axis labels
+        gAxes.append('text')
+          .attr('class', 'x-axis-label')
+          .attr('x', innerWidth / 2)
+          .attr('y', innerHeight + Math.max(20, Math.min(36, margin.bottom - 10)))
+          .attr('fill', 'var(--text-color)')
+          .attr('text-anchor', 'middle')
+          .style('font-size', '12px')
+          .style('font-weight', '700')
+          .text('Steps');
+
+        gAxes.append('text')
+          .attr('class', 'y-axis-label')
+          .attr('transform', 'rotate(-90)')
+          .attr('x', -innerHeight / 2)
+          .attr('y', -Math.max(16, Math.min(28, margin.left - 8) + 10))
+          .attr('fill', 'var(--text-color)')
+          .attr('text-anchor', 'middle')
+          .style('font-size', '12px')
+          .style('font-weight', '700')
+          .text(axisLabelY);
+
+        return { innerWidth, innerHeight, tickColor };
+      }
+
+      function renderMetric(metricKey){
+        const map = dataByMetric.get(metricKey) || {};
+        const runs = runOrder;
+        let minStep = Infinity, maxStep = -Infinity, maxVal = 0, minVal = Infinity;
+        const isRank = /rank/i.test(metricKey); const isAverage = /average/i.test(metricKey); const isRankStrict = isRank && !isAverage;
+        runs.forEach(r => { (map[r]||[]).forEach(pt => { const v = isRankStrict ? Math.round(pt.value) : pt.value; minStep=Math.min(minStep,pt.step); maxStep=Math.max(maxStep,pt.step); maxVal=Math.max(maxVal,v); minVal=Math.min(minVal,v); }); });
+        if (!isFinite(minStep) || !isFinite(maxStep)) return;
+        xScale.domain([minStep, maxStep]);
+        if (sharedYConfig && sharedYConfig.type === 'rank_strict') {
+          rankTickMax = Math.max(1, Math.round(sharedYConfig.maxRank||1));
+          yScale.domain([rankTickMax, 1]);
+          isRankStrictFlag = true;
+          isRankMetricFlag = true;
+        } else if (sharedYConfig && sharedYConfig.type === 'value') {
+          yScale.domain([sharedYConfig.min, sharedYConfig.max]);
+          isRankStrictFlag = isRankStrict;
+          isRankMetricFlag = isRank;
+        } else {
+          if (isRank) { rankTickMax = Math.max(1, Math.round(maxVal)); yScale.domain([rankTickMax, 1]); }
+          else { yScale.domain([minVal, maxVal]).nice(); }
+          isRankStrictFlag = isRankStrict;
+          isRankMetricFlag = isRank;
+        }
+
+        axisLabelY = isRankStrict ? 'Rank' : prettyMetricLabel(metricKey);
+        const tChange = (window.d3 && d3.transition) ? d3.transition().duration(260).ease(d3.easeCubicOut) : null;
+        const { innerWidth, innerHeight } = updateScales();
+
+        const colorForRun = (run, idx) => {
+          if (SHARED_RUN_COLOR && Object.prototype.hasOwnProperty.call(SHARED_RUN_COLOR, run)) return SHARED_RUN_COLOR[run];
+          const j = (typeof idx === 'number' ? idx : runs.indexOf(run));
+          return pool[(j >= 0 ? j : 0) % pool.length];
+        };
+        const series = runs.map((r, i) => ({ run:r, color: colorForRun(r, i), values:(map[r]||[]).slice().sort((a,b)=>a.step-b.step).map(pt => isRankStrict ? { step: pt.step, value: Math.round(pt.value), stderr: pt.stderr } : pt) }));
+
+        // zones ± stderr (métriques non rank)
+        gAreas.selectAll('*').remove();
+        if (!isRank) {
+          series.forEach((s) => {
+            const withErr = s.values.filter(v => v && v.stderr != null && isFinite(v.stderr) && v.stderr > 0 && isFinite(v.value));
+            if (!withErr.length) return;
+            const upper = withErr.map(d => [xScale(d.step), yScale(d.value + d.stderr)]);
+            const lower = withErr.slice().reverse().map(d => [xScale(d.step), yScale(d.value - d.stderr)]);
+            const coords = upper.concat(lower);
+            const pathData = d3.line().x(d=>d[0]).y(d=>d[1]).curve(d3.curveLinearClosed)(coords);
+            gAreas.append('path')
+              .attr('class','area')
+              .attr('data-run', s.run)
+              .attr('d', pathData)
+              .attr('fill', s.color)
+              .attr('opacity', 0)
+              .attr('stroke', 'none')
+              .transition().duration(450).ease(d3.easeCubicOut)
+              .attr('opacity', 0.15);
+          });
+        }
+
+        const paths = gLines.selectAll('path.run-line').data(series, d=>d.run);
+        paths.enter()
+          .append('path')
+          .attr('class','run-line')
+          .attr('data-run', d=>d.run)
+          .attr('fill','none')
+          .attr('stroke-width', 1)
+          .attr('opacity',0)
+          .attr('stroke', d=>d.color)
+          .attr('d', d=>lineGen(d.values))
+          .transition(tChange || undefined)
+          .attr('opacity',0.9);
+        paths
+          .transition(tChange || undefined)
+          .attr('stroke', d=>d.color)
+          .attr('opacity',0.9)
+          .attr('d', d=>lineGen(d.values));
+        paths.exit().remove();
+
+        // Draw light point markers at each data sample (subtle)
+        const allPoints = series.flatMap(s => s.values.map(v => ({ run:s.run, color:s.color, step:v.step, value:v.value })));
+        const ptsSel = gPoints.selectAll('circle.pt').data(allPoints, d=> `${d.run}-${d.step}`);
+        ptsSel.enter().append('circle').attr('class','pt')
+          .attr('data-run', d=>d.run)
+          .attr('r', 1.5)
+          .attr('fill', d=>d.color)
+          .attr('fill-opacity', 0.6)
+          .attr('stroke', 'none')
+          .attr('cx', d=>xScale(d.step))
+          .attr('cy', d=>yScale(d.value))
+          .merge(ptsSel)
+          .attr('fill', d=>d.color)
+          .transition(tChange || undefined)
+          .attr('r', 2)
+          .attr('cx', d=>xScale(d.step))
+          .attr('cy', d=>yScale(d.value));
+        ptsSel.exit().remove();
+
+        // No per-cell legend content (handled globally)
+
+        // Hover
+        gHover.selectAll('*').remove();
+        const overlay = gHover.append('rect').attr('fill','transparent').style('cursor','crosshair').attr('x',0).attr('y',0).attr('width', innerWidth).attr('height', innerHeight);
+        const hoverLine = gHover.append('line').style('stroke','var(--text-color)').attr('stroke-opacity', 0.25).attr('stroke-width',1).attr('y1',0).attr('y2',innerHeight).style('display','none');
+        const stepSet = new Set(); series.forEach(s=>s.values.forEach(v=>stepSet.add(v.step))); const steps = Array.from(stepSet).sort((a,b)=>a-b);
+        function onMove(ev){ if (hideTipTimer) { clearTimeout(hideTipTimer); hideTipTimer = null; } const [mx,my]=d3.pointer(ev, overlay.node()); const nearest = steps.reduce((best,s)=> Math.abs(s - xScale.invert(mx)) < Math.abs(best - xScale.invert(mx)) ? s : best, steps[0]); const xpx = xScale(nearest); hoverLine.attr('x1',xpx).attr('x2',xpx).style('display',null);
+          let html = `<div><strong>${titleText}</strong></div><div><strong>step</strong> ${formatK(nearest)}</div>`;
+          const entries = series.map(s=>{ const map = new Map(s.values.map(v=>[v.step, v])); const pt = map.get(nearest); return { run:s.run, color:s.color, pt }; }).filter(e => e.pt && e.pt.value!=null);
+          entries.sort((a,b)=> (a.pt.value - b.pt.value));
+          const fmt = (vv)=> (isRankStrictFlag? d3.format('d')(vv) : (+vv).toFixed(4));
+          entries.forEach(e => {
+            const err = (e.pt.stderr!=null && isFinite(e.pt.stderr) && e.pt.stderr>0) ? ` ± ${fmt(e.pt.stderr)}` : '';
+            html += `<div style="display:flex;align-items:center;gap:8px;white-space:nowrap;"><span class=\"d3-tooltip__color-dot\" style=\"background:${e.color}\"></span><strong>${e.run}</strong><span style=\"margin-left:auto;text-align:right;\">${fmt(e.pt.value)}${err}</span></div>`;
+          });
+          tipInner.innerHTML = html; const offsetX=12, offsetY=12; tip.style.opacity='1'; tip.style.transform=`translate(${Math.round(mx+offsetX+margin.left)}px, ${Math.round(my+offsetY+margin.top)}px)`; }
+        function onLeave(){ hideTipTimer = setTimeout(()=>{ tip.style.opacity='0'; tip.style.transform='translate(-9999px, -9999px)'; hoverLine.style('display','none'); }, 100); }
+        overlay.on('mousemove', onMove).on('mouseleave', onLeave);
+      }
+
+      async function load(){
+        try {
+          const file = (csvPath || '').split('/').pop();
+          const CANDIDATES = [
+            csvPath,
+            `/data/${file}`,
+            `./assets/data/${file}`,
+            `../assets/data/${file}`,
+            `../../assets/data/${file}`
+          ].filter(Boolean);
+          let text = null;
+          for (const p of CANDIDATES){
+            try { const r = await fetch(p, { cache:'no-cache' }); if (r.ok) { text = await r.text(); break; } } catch(e){}
+          }
+          if (text == null) throw new Error(`CSV not found: ${file}`);
+          const rows = d3.csvParse(text, d => ({ run:(d.run||'').trim(), step:+d.step, metric:(d.metric||'').trim(), value:+d.value, stderr: (d.stderr!=null && d.stderr!=='') ? +d.stderr : null }));
+          metricList = Array.from(new Set(rows.map(r=>r.metric))).sort();
+          runList = Array.from(new Set(rows.map(r=>r.run))).sort(); runOrder = runList;
+          metricList.forEach(m => { const map={}; runList.forEach(r=>map[r]=[]); rows.filter(r=>r.metric===m).forEach(r=>{ if(!isNaN(r.step)&&!isNaN(r.value)) map[r.run].push({ step:r.step, value:r.value, stderr:r.stderr }); }); dataByMetric.set(m, map); });
+          const preferred = metricList.find(m => m === 'ai2d_exact_match') || metricList.find(m => /average_rank/i.test(m));
+          const def = preferred || metricList[0];
+          renderMetric(def);
+          const ro = window.ResizeObserver ? new ResizeObserver(()=>renderMetric(def)) : null; if (ro) ro.observe(cell);
+          if (typeof readyResolve === 'function') readyResolve();
+        } catch (e) {
+          const pre = document.createElement('pre'); pre.textContent = 'CSV load error: ' + (e && e.message ? e.message : e);
+          pre.style.color = 'var(--danger, #b00020)'; pre.style.fontSize = '12px'; pre.style.whiteSpace = 'pre-wrap'; cell.appendChild(pre);
+          if (typeof readyResolve === 'function') readyResolve();
+        }
+      }
+      load();
+      
+      return {
+        ready,
+        getMetrics: () => metricList.slice(),
+        setMetric: (m) => { if (m) renderMetric(m); },
+        getYInfo: (m) => {
+          const key = m; const map = dataByMetric.get(key) || {}; const runs = runOrder;
+          let maxVal = 0, minVal = Infinity; let minStep = Infinity, maxStep = -Infinity;
+          const isRank = /rank/i.test(key); const isAverage = /average/i.test(key); const isRankStrict = isRank && !isAverage;
+          runs.forEach(r => { (map[r]||[]).forEach(pt => { const v = isRankStrict ? Math.round(pt.value) : pt.value; minStep=Math.min(minStep,pt.step); maxStep=Math.max(maxStep,pt.step); maxVal=Math.max(maxVal,v); minVal=Math.min(minVal,v); }); });
+          const rankMax = isRank ? Math.max(1, Math.round(maxVal)) : null;
+          return { isRank, isRankStrict, min: maxVal === 0 && minVal === Infinity ? null : minVal, max: maxVal, rankMax };
+        },
+        setSharedY: (cfg) => { sharedYConfig = cfg || null; if (metricList && metricList.length) { /* re-render last metric if possible */ const current = cfg && cfg.key ? cfg.key : null; const m = current || metricList[0]; renderMetric(m); } }
+      };
+    }
+
+    const bootstrap = () => {
+      const scriptEl = THIS_SCRIPT;
+      let host = null;
+      // Build header (legend + controls) and append after grid
+      const header = document.createElement('div'); header.className = 'line-quad__header';
+      const legend = document.createElement('div'); legend.className = 'legend-bottom'; legend.innerHTML = '<div class="legend-title">Legend</div><div class="items"></div>';
+      const controls = document.createElement('div'); controls.className = 'controls'; controls.innerHTML = '<div class="control-group"><label>Metric</label><select></select></div>';
+      header.appendChild(legend);
+      header.appendChild(controls);
+      // Try finding within parent (fragment mount is inside parent)
+      if (scriptEl && scriptEl.parentElement && scriptEl.parentElement.querySelector) {
+        host = scriptEl.parentElement.querySelector('.line-quad');
+      }
+      // Fallback: scan previous siblings
+      if (!host) {
+        let sib = scriptEl && scriptEl.previousElementSibling;
+        while (sib && !(sib.classList && sib.classList.contains('line-quad'))) {
+          sib = sib.previousElementSibling;
+        }
+        host = sib || null;
+      }
+      // Last resort: global query
+      if (!host) { host = document.querySelector('.line-quad'); }
+      if (!host) return;
+      if (host.dataset && host.dataset.mounted === 'true') return; if (host.dataset) host.dataset.mounted = 'true';
+      const cells = host.querySelectorAll('.quad-cell'); if (!cells.length) return;
+      host.appendChild(header);
+      const instances = Array.from(cells).map(cell => initRunLine(cell));
+
+      (async () => {
+        // Wait for all charts to finish loading their CSVs
+        await Promise.all(instances.map(i => i.ready));
+        const lists = instances.map(i => i.getMetrics()).filter(a => Array.isArray(a) && a.length);
+        const intersect = (arrs) => arrs.reduce((acc, cur) => acc.filter(x => cur.includes(x)));
+        let metrics = lists.length ? intersect(lists) : [];
+        if (!metrics.length) { metrics = lists[0] || []; }
+        const def = (metrics.includes('ai2d_exact_match') ? 'ai2d_exact_match' : (metrics.find(m => /average_rank/i.test(m)) || metrics[0] || ''));
+
+        // Wire header controls (select under "Metric" label)
+        const headerEl = host.querySelector('.line-quad__header');
+        if (headerEl && !headerEl.isConnected) host.appendChild(header);
+        const select = (headerEl || header).querySelector('.controls select');
+        if (select) {
+          select.innerHTML = '';
+          metrics.forEach(m => { const o=document.createElement('option'); o.value=m; o.textContent=prettyMetricLabel(m); select.appendChild(o); });
+          if (def) select.value = def;
+        }
+
+        const computeAndApplySharedY = (metric) => {
+          try {
+            const infos = instances.map(i => i && typeof i.getYInfo === 'function' ? i.getYInfo(metric) : null).filter(Boolean);
+            if (!infos.length) return;
+            const anyRank = infos.some(info => info.isRank);
+            if (anyRank) {
+              const maxRank = Math.max(1, ...infos.map(info => Math.round(info.rankMax || 1)));
+              instances.forEach(i => i && typeof i.setSharedY === 'function' && i.setSharedY({ type: 'rank_strict', maxRank, key: metric }));
+            } else {
+              const min = Math.min(...infos.map(info => info.min));
+              const max = Math.max(...infos.map(info => info.max));
+              instances.forEach(i => i && typeof i.setSharedY === 'function' && i.setSharedY({ type: 'value', min, max, key: metric }));
+            }
+          } catch (_) {}
+        };
+
+        const applyAll = (v) => { computeAndApplySharedY(v); instances.forEach(i => i && typeof i.setMetric === 'function' && i.setMetric(v)); };
+        if (def) applyAll(def);
+        if (select) select.addEventListener('change', () => applyAll(select.value));
+
+        // Global legend (in header, colors only)
+        const legendItemsHost = (headerEl || header).querySelector('.legend-bottom .items');
+        if (legendItemsHost) {
+          try {
+            const f = '/data/formatting_filters.csv';
+            const r = await fetch(f, { cache:'no-cache' });
+            if (r.ok && window.d3 && window.d3.csvParse) {
+              const txt = await r.text();
+              const rows = window.d3.csvParse(txt);
+              const runList = Array.from(new Set(rows.map(row => String(row.run||'').trim()).filter(Boolean))).sort();
+              const poolLegend = (window.ColorPalettes && typeof window.ColorPalettes.getColors==='function')
+                ? window.ColorPalettes.getColors('categorical', runList.length)
+                : (()=>{ const primary = getComputedStyle(document.documentElement).getPropertyValue('--primary-color').trim() || '#E889AB'; return [primary, '#4EA5B7', '#E38A42', '#CEC0FA', ...((window.d3 && window.d3.schemeTableau10) ? window.d3.schemeTableau10 : ['#4e79a7','#f28e2b','#e15759','#76b7b2','#59a14f','#edc948','#b07aa1','#ff9da7','#9c755f','#bab0ab'])]; })();
+              // Build shared run->color map once
+              SHARED_RUN_COLOR = {};
+              runList.forEach((name, i) => { SHARED_RUN_COLOR[name] = poolLegend[i % poolLegend.length]; });
+              legendItemsHost.innerHTML = runList.map((name) => {
+                const color = SHARED_RUN_COLOR[name];
+                return `<span class="item" data-run="${name}"><span class=\"swatch\" style=\"background:${color}\"></span><span>${name}</span></span>`;
+              }).join('');
+              // Re-render all cells with the shared mapping to ensure perfect sync
+              try {
+                const currentMetric = (select && select.value) || def;
+                if (currentMetric) applyAll(currentMetric);
+              } catch {}
+              // Legend hover ghosting across all cells
+              legendItemsHost.querySelectorAll('.item').forEach(el => {
+                el.addEventListener('mouseenter', () => {
+                  const run = el.getAttribute('data-run'); if (!run) return;
+                  host.classList.add('hovering');
+                  host.querySelectorAll('.quad-cell').forEach(cell => {
+                    cell.querySelectorAll('.lines path.run-line').forEach(p => p.classList.toggle('ghost', p.getAttribute('data-run') !== run));
+                    cell.querySelectorAll('.points circle.pt').forEach(c => c.classList.toggle('ghost', c.getAttribute('data-run') !== run));
+                    cell.querySelectorAll('.areas path.area').forEach(a => a.classList.toggle('ghost', a.getAttribute('data-run') !== run));
+                  });
+                  legendItemsHost.querySelectorAll('.item').forEach(it => it.classList.toggle('ghost', it.getAttribute('data-run') !== run));
+                });
+                el.addEventListener('mouseleave', () => {
+                  host.classList.remove('hovering');
+                  host.querySelectorAll('.quad-cell').forEach(cell => {
+                    cell.querySelectorAll('.lines path.run-line').forEach(p => p.classList.remove('ghost'));
+                    cell.querySelectorAll('.points circle.pt').forEach(c => c.classList.remove('ghost'));
+                    cell.querySelectorAll('.areas path.area').forEach(a => a.classList.remove('ghost'));
+                  });
+                  legendItemsHost.querySelectorAll('.item').forEach(it => it.classList.remove('ghost'));
+                });
+              });
+            }
+          } catch {}
+        }
+      })();
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
+
+
+
diff --git a/app/src/content/embeds/d3-line.html b/app/src/content/embeds/d3-line.html
new file mode 100644
index 0000000000000000000000000000000000000000..e3cd75e76ef628a06a23e233e24c98e98f103b12
--- /dev/null
+++ b/app/src/content/embeds/d3-line.html
@@ -0,0 +1,458 @@
+<div class="d3-line-simple"></div>
+<style>
+  .d3-line-simple { position: relative; }
+  .d3-line-simple .controls {
+    margin-top: 0;
+    display: flex;
+    gap: 16px;
+    align-items: center;
+    justify-content: flex-end;
+    width: auto;
+    flex-wrap: wrap;
+  }
+  .d3-line-simple .controls label {
+    font-size: 12px;
+    color: var(--text-color);
+    display: flex;
+    align-items: center;
+    gap: 6px;
+    white-space: nowrap;
+    font-weight: 700;
+  }
+  .d3-line-simple .controls select {
+    font-size: 12px;
+    padding: 8px 28px 8px 10px;
+    border: 1px solid var(--border-color);
+    border-radius: 8px;
+    background-color: var(--surface-bg);
+    color: var(--text-color);
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%230f1115' stroke-width='2' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+    background-repeat: no-repeat; background-position: right 8px center; background-size: 12px;
+    -webkit-appearance: none; appearance: none; cursor: pointer; transition: border-color .15s ease, box-shadow .15s ease;
+  }
+  [data-theme="dark"] .d3-line-simple .controls select {
+    background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='0 0 24 24' fill='none' stroke='%23ffffff' stroke-width='2' stroke-linecap='round' stroke-linejoin='round'%3E%3Cpolyline points='6 9 12 15 18 9'/%3E%3C/svg%3E");
+  }
+  .d3-line-simple .controls select:hover { border-color: var(--primary-color); }
+  .d3-line-simple .controls select:focus { border-color: var(--primary-color); box-shadow: 0 0 0 3px rgba(232,137,171,.25); outline: none; }
+  .d3-line-simple .axis-label { fill: var(--text-color); font-size: 12px; font-weight: 700; }
+  .d3-line-simple .axes path, .d3-line-simple .axes line { stroke: var(--axis-color); }
+  .d3-line-simple .axes text { fill: var(--tick-color); }
+  .d3-line-simple .grid line { stroke: var(--grid-color); }
+  .d3-line-simple .legend { font-size: 12px; color: var(--text-color);padding-left: 6px; }
+  .d3-line-simple .legend .items { display:flex; flex-wrap:wrap; gap:8px 12px; align-items:center; }
+  .d3-line-simple .legend .item { display:flex; align-items:center; gap:6px; white-space:nowrap; }
+  .d3-line-simple .legend .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; }
+  /* Ghosting on hover */
+  .d3-line-simple.hovering .legend-bottom .item.ghost { opacity: .35; }
+  .d3-line-simple.hovering .lines path.ghost { opacity: .25; }
+  .d3-line-simple.hovering .points circle.ghost { opacity: .25; }
+  .d3-line-simple.hovering .areas path.ghost { opacity: .08; }
+  .d3-line-simple .chart-header { display:flex; align-items:center; justify-content:space-between; gap:12px; margin: 0 0 8px 0; flex-wrap: wrap; }
+  .d3-line-simple .legend-bottom { display:flex; align-items:center; justify-content:flex-start; font-size:12px; color: var(--text-color); }
+  .d3-line-simple .legend-bottom .items { display:flex; flex-wrap:wrap; gap:8px 14px; }
+  .d3-line-simple .legend-bottom .item { display:inline-flex; align-items:center; gap:6px; white-space:nowrap; }
+  .d3-line-simple .legend-bottom .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; }
+  .d3-line-simple .lines path.active { stroke-width: 3; }
+  /* Layout tweaks: stack label above select, add legend title above items */
+  .d3-line-simple .controls .control-group {
+    display: flex;
+    flex-direction: column;
+    align-items: flex-start;
+    gap: 6px;
+  }
+  .d3-line-simple .legend-bottom {
+    flex-direction: column;
+    align-items: flex-start;
+    gap: 6px;
+  }
+  .d3-line-simple .legend-bottom .legend-title {
+    font-size: 12px;
+    font-weight: 700;
+    color: var(--text-color);
+  }
+  /* Tooltip styling aligned with filters-quad */
+  .d3-line-simple .d3-tooltip { z-index: var(--z-elevated); backdrop-filter: saturate(1.12) blur(8px); }
+  .d3-line-simple .d3-tooltip__inner { display:flex; flex-direction:column; gap:6px; min-width: 220px; }
+  .d3-line-simple .d3-tooltip__inner > div:first-child { font-weight: 800; letter-spacing: 0.1px; margin-bottom: 0; }
+  .d3-line-simple .d3-tooltip__inner > div:nth-child(2) { font-size: 11px; color: var(--muted-color); display: block; margin-top: -4px; margin-bottom: 2px; letter-spacing: 0.1px; }
+  .d3-line-simple .d3-tooltip__inner > div:nth-child(n+3) { padding-top: 6px; border-top: 1px solid var(--border-color); }
+  .d3-line-simple .d3-tooltip__color-dot { display:inline-block; width: 12px; height: 12px; border-radius: 3px; border: 1px solid var(--border-color); }
+  /* Chart card only around the SVG */
+  .d3-line-simple .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+  /* Place header below chart and align start */
+  .d3-line-simple .chart-header { display:flex; align-items:flex-start; justify-content:flex-start; gap:12px; margin: 8px 0 0 0; flex-wrap: wrap; }
+</style>
+<script>
+  (() => {
+    // Pretty label mapping for metric keys (aligned with filters-quad)
+    const prettyMetricLabel = (key) => {
+      if (!key) return '';
+      const table = {
+        'ai2d_exact_match': 'AI2D Exact Match',
+        'average_rank': 'Average Rank',
+      };
+      if (table[key]) return table[key];
+      const cleaned = String(key).replace(/[_-]+/g, ' ').trim();
+      return cleaned.split(/\s+/).map(w => {
+        if (/^(ai2d|umap|id|auc|f1)$/i.test(w)) return w.toUpperCase();
+        return w.charAt(0).toUpperCase() + w.slice(1);
+      }).join(' ');
+    };
+
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true }); if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-line-simple'))){
+        const cs = Array.from(document.querySelectorAll('.d3-line-simple')).filter(el => !(el.dataset && el.dataset.mounted === 'true'));
+        container = cs[cs.length - 1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted === 'true') return; container.dataset.mounted = 'true'; }
+
+      // Controls (we will place them in a footer below the chart)
+      const controls = document.createElement('div');
+      controls.className = 'controls';
+      const controlGroup = document.createElement('div');
+      controlGroup.className = 'control-group';
+      const labelMetric = document.createElement('label');
+      labelMetric.textContent = 'Metric';
+      const selectMetric = document.createElement('select');
+      // Associate label and select with a unique id
+      const uniqueId = Math.random().toString(36).slice(2, 9);
+      selectMetric.id = `metric-select-${uniqueId}`;
+      labelMetric.setAttribute('for', selectMetric.id);
+      controlGroup.appendChild(labelMetric);
+      controlGroup.appendChild(selectMetric);
+      controls.appendChild(controlGroup);
+
+      // Tooltip
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none',
+          padding:'8px 10px', borderRadius:'8px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)',
+          background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 4px 24px rgba(0,0,0,.18)', opacity:'0', transition:'opacity .12s ease'
+        });
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // Header (legend + controls) placed after the chart
+      const header = document.createElement('div'); header.className = 'chart-header';
+      const legendBottom = document.createElement('div'); legendBottom.className = 'legend-bottom'; header.appendChild(legendBottom);
+      header.appendChild(controls);
+
+      // Chart card (SVG)
+      const card = document.createElement('div'); card.className = 'chart-card'; container.appendChild(card);
+      container.appendChild(header);
+      // SVG
+      const svg = d3.select(card).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+      const gGrid = gRoot.append('g').attr('class','grid');
+      const gAxes = gRoot.append('g').attr('class','axes');
+      const gAreas = gRoot.append('g').attr('class','areas');
+      const gLines = gRoot.append('g').attr('class','lines');
+      const gPoints = gRoot.append('g').attr('class','points');
+      // (legend removed from inside SVG)
+      const overlay = gRoot.append('rect').attr('fill','transparent').style('cursor','crosshair');
+      const hoverLine = gRoot.append('line').attr('stroke-width',1).style('display','none');
+
+      // State/data
+      let width = 800, height = 480; const margin = { top: 16, right: 32, bottom: 44, left: 56 };
+      const xScale = d3.scaleLinear();
+      const yScale = d3.scaleLinear();
+      const lineGen = d3.line().x(d => xScale(d.step)).y(d => yScale(d.value));
+      const dataByMetric = new Map();
+      let runOrder = [];
+
+      // Colors
+      function getRunColors(count){
+        try { if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') return window.ColorPalettes.getColors('categorical', count); } catch(_){}
+        return d3.schemeTableau10 ? d3.schemeTableau10.slice(0, count) : ['#4e79a7','#f28e2b','#e15759','#76b7b2','#59a14f','#edc948','#b07aa1','#ff9da7','#9c755f','#bab0ab'].slice(0, count);
+      }
+      // Format helper for thousands (5000 -> 5k, 1500 -> 1.5k)
+      function formatK(v){
+        const abs = Math.abs(v);
+        if (abs >= 1000) {
+          const n = v / 1000;
+          const s = d3.format('.1f')(n);
+          return (s.endsWith('.0') ? s.slice(0, -2) : s) + 'k';
+        }
+        return d3.format('d')(v);
+      }
+
+      // CSV: prefer public path, fallback to relative
+      // Data file(s) from HtmlEmbed attribute (string or JSON array), else default cascade
+      // Find the HtmlEmbed wrapper that carries data-datafiles
+      let mountEl = container;
+      while (mountEl && !mountEl.getAttribute?.('data-datafiles') && !mountEl.getAttribute?.('data-config')) {
+        mountEl = mountEl.parentElement;
+      }
+      let providedData = null;
+      let providedConfig = null;
+      try {
+        const attr = mountEl && mountEl.getAttribute ? mountEl.getAttribute('data-datafiles') : null;
+        if (attr && attr.trim()) {
+          providedData = attr.trim().startsWith('[') ? JSON.parse(attr) : attr.trim();
+        }
+      } catch(_) {}
+      try {
+        const cfg = mountEl && mountEl.getAttribute ? mountEl.getAttribute('data-config') : null;
+        if (cfg && cfg.trim()) {
+          providedConfig = cfg.trim().startsWith('{') ? JSON.parse(cfg) : cfg;
+        }
+      } catch(_) {}
+      const DEFAULT_CSV = '/data/formatting_filters.csv';
+      // Normalize: if a provided path has no slash, assume it lives under /data/
+      const ensureDataPrefix = (p) => {
+        if (typeof p !== 'string' || !p) return p;
+        return p.includes('/') ? p : `/data/${p}`;
+      };
+      const normalizeInput = (inp) => Array.isArray(inp) ? inp.map(ensureDataPrefix) : (typeof inp === 'string' ? [ ensureDataPrefix(inp) ] : null);
+      const CSV_PATHS = Array.isArray(providedData)
+        ? normalizeInput(providedData)
+        : (typeof providedData === 'string' ? normalizeInput(providedData) || [DEFAULT_CSV] : [
+            DEFAULT_CSV,
+            './assets/data/formatting_filters.csv',
+            '../assets/data/formatting_filters.csv',
+            '../../assets/data/formatting_filters.csv'
+          ]);
+      const fetchFirstAvailable = async (paths) => {
+        for (const p of paths) { try { const r = await fetch(p, { cache: 'no-cache' }); if (r.ok) return await r.text(); } catch(_){} }
+        throw new Error('CSV not found: formatting_filters.csv');
+      };
+
+      function updateLayout(){
+        const axisColor = getComputedStyle(container).getPropertyValue('--axis-color').trim() || 'rgba(0,0,0,0.25)';
+        width = container.clientWidth || 800;
+        height = Math.max(280, Math.round(width / 3));
+        svg.attr('width', width).attr('height', height);
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        const innerWidth = width - margin.left - margin.right;
+        const innerHeight = height - margin.top - margin.bottom;
+        overlay.attr('x',0).attr('y',0).attr('width', innerWidth).attr('height', innerHeight);
+        hoverLine.attr('y1',0).attr('y2', innerHeight).attr('stroke', axisColor);
+        return { innerWidth, innerHeight };
+      }
+
+      function render(metricKey){
+        const { innerWidth, innerHeight } = updateLayout();
+        const map = dataByMetric.get(metricKey) || {};
+        const runs = runOrder;
+        // domains
+        let minStep = Infinity, maxStep = -Infinity, minV = Infinity, maxV = -Infinity;
+        runs.forEach(r => { (map[r]||[]).forEach(pt => { minStep = Math.min(minStep, pt.step); maxStep = Math.max(maxStep, pt.step); minV = Math.min(minV, pt.value); maxV = Math.max(maxV, pt.value); }); });
+        if (!isFinite(minStep) || !isFinite(maxStep)) return;
+        xScale.domain([minStep, maxStep]).range([0, innerWidth]);
+        yScale.domain([minV, maxV]).nice().range([innerHeight, 0]);
+
+        // grid
+        gGrid.selectAll('*').remove();
+        gGrid.selectAll('line').data(yScale.ticks(6)).join('line')
+          .attr('x1',0).attr('x2', innerWidth).attr('y1', d=>yScale(d)).attr('y2', d=>yScale(d))
+          .attr('stroke','var(--grid-color)').attr('stroke-width',1).attr('shape-rendering','crispEdges');
+
+        // axes
+        gAxes.selectAll('*').remove();
+        gAxes.append('g').attr('transform', `translate(0,${innerHeight})`).call(d3.axisBottom(xScale).ticks(8).tickFormat(formatK)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('g').call(d3.axisLeft(yScale).ticks(6)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('x', innerWidth/2).attr('y', innerHeight + 38).text('Step');
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('transform', `translate(${-44}, ${innerHeight/2}) rotate(-90)`).text('Value');
+
+        // shaded areas (stderr or min/max if provided)
+        gAreas.selectAll('*').remove();
+        const areaGenClosed = d3.line().x(d=>d[0]).y(d=>d[1]).curve(d3.curveLinearClosed);
+        // Colors (needed for both areas and lines)
+        const colors = getRunColors(runs.length);
+        const seriesForAreas = [];
+        runs.forEach((r, i) => {
+          const vals = (map[r]||[]).slice().sort((a,b)=>a.step-b.step);
+          const withBounds = vals.map(v => {
+            let lo = null, hi = null;
+            if (v.stderr != null && isFinite(v.stderr) && v.stderr > 0) { lo = v.value - v.stderr; hi = v.value + v.stderr; }
+            if (v.min != null && isFinite(v.min)) lo = (lo==null) ? v.min : lo;
+            if (v.max != null && isFinite(v.max)) hi = (hi==null) ? v.max : hi;
+            return { step: v.step, lo, hi };
+          }).filter(v => v.lo != null && v.hi != null && isFinite(v.lo) && isFinite(v.hi));
+          if (withBounds.length > 0) {
+            seriesForAreas.push({ run: r, color: colors[i % colors.length], bounds: withBounds });
+          }
+        });
+        seriesForAreas.forEach(s => {
+          const upper = s.bounds.map(d => [ xScale(d.step), yScale(d.hi) ]);
+          const lower = s.bounds.slice().reverse().map(d => [ xScale(d.step), yScale(d.lo) ]);
+          const coords = upper.concat(lower);
+          gAreas.append('path')
+            .attr('class','area')
+            .attr('data-run', s.run)
+            .attr('d', areaGenClosed(coords))
+            .attr('fill', s.color)
+            .attr('opacity', 0.15)
+            .attr('stroke','none');
+        });
+
+        // lines
+        const series = runs.map((r, i) => ({ run:r, color: colors[i % colors.length], values: (map[r]||[]).slice().sort((a,b)=>a.step-b.step) }));
+        const paths = gLines.selectAll('path.run').data(series, d=>d.run);
+        const pathsEnter = paths.enter().append('path').attr('class','run').attr('fill','none').attr('stroke-width',2).attr('stroke', d=>d.color).attr('d', d=>lineGen(d.values));
+        pathsEnter.merge(paths).transition().duration(200).attr('stroke', d=>d.color).attr('d', d=>lineGen(d.values));
+        paths.exit().remove();
+
+        // Hover capture paths (wider invisible stroke for easy hover)
+        const captures = gLines.selectAll('path.run-hover').data(series, d=>`cap-${d.run}`);
+        captures.enter().append('path').attr('class','run-hover').attr('fill','none').attr('stroke','transparent').attr('stroke-width', 12).style('pointer-events','stroke')
+          .attr('d', d=>lineGen(d.values))
+          .merge(captures)
+          .attr('d', d=>lineGen(d.values))
+          .on('mouseenter', function(ev, d){
+            container.classList.add('hovering');
+            // ghost non hovered lines and points
+            gLines.selectAll('path.run').classed('ghost', s => s.run !== d.run);
+            gPoints.selectAll('circle.pt').classed('ghost', p => p.run !== d.run);
+            gAreas.selectAll('path.area').classed('ghost', a => a && a.getAttribute && a.getAttribute('data-run') !== d.run);
+            // ghost legend items
+            try {
+              const legendNode = legendBottom;
+              if (legendNode) {
+                legendNode.querySelectorAll('.item').forEach(el => {
+                  const name = el.getAttribute('data-run');
+                  el.classList.toggle('ghost', name !== d.run);
+                });
+              }
+            } catch {}
+          })
+          .on('mouseleave', function(){
+            container.classList.remove('hovering');
+            gLines.selectAll('path.run').classed('ghost', false);
+            gPoints.selectAll('circle.pt').classed('ghost', false);
+            gAreas.selectAll('path.area').classed('ghost', false);
+            try { const legendNode = legendBottom; if (legendNode) legendNode.querySelectorAll('.item').forEach(el => el.classList.remove('ghost')); } catch {}
+          });
+        captures.exit().remove();
+
+        // point markers (subtle)
+        const allPts = series.flatMap(s => s.values.map(v => ({ run:s.run, color:s.color, step:v.step, value:v.value })));
+        const ptsSel = gPoints.selectAll('circle.pt').data(allPts, d=>`${d.run}-${d.step}`);
+        ptsSel.enter().append('circle').attr('class','pt').attr('r', 2).attr('fill', d=>d.color).attr('fill-opacity', 0.6)
+          .attr('cx', d=>xScale(d.step)).attr('cy', d=>yScale(d.value))
+          .merge(ptsSel).transition().duration(150).attr('cx', d=>xScale(d.step)).attr('cy', d=>yScale(d.value));
+        ptsSel.exit().remove();
+
+        // legend (HTML below, left) with title above items
+        legendBottom.innerHTML = `<div class="legend-title">Legend</div><div class="items">${series.map(s => `<span class="item" data-run="${s.run}"><span class="swatch" style="background:${s.color}"></span><span>${s.run}</span></span>`).join('')}</div>`;
+        // Legend hover → ghost lines/points
+        try {
+          const legendNode = legendBottom;
+          legendNode.querySelectorAll('.item').forEach(el => {
+            el.addEventListener('mouseenter', () => {
+              const run = el.getAttribute('data-run'); if (!run) return;
+              container.classList.add('hovering');
+              gLines.selectAll('path.run').classed('ghost', s => s.run !== run);
+              gPoints.selectAll('circle.pt').classed('ghost', p => p.run !== run);
+              gAreas.selectAll('path.area').classed('ghost', a => a && a.getAttribute && a.getAttribute('data-run') !== run);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.toggle('ghost', it.getAttribute('data-run') !== run));
+            });
+            el.addEventListener('mouseleave', () => {
+              container.classList.remove('hovering');
+              gLines.selectAll('path.run').classed('ghost', false);
+              gPoints.selectAll('circle.pt').classed('ghost', false);
+              gAreas.selectAll('path.area').classed('ghost', false);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.remove('ghost'));
+            });
+          });
+        } catch {}
+
+        // hover
+        function onMove(ev){
+          const [mx, my] = d3.pointer(ev, overlay.node());
+          const sx = xScale.invert(mx);
+          // nearest integer step if steps are integers; else nearest by distance
+          const steps = Array.from(new Set(allPts.map(p=>p.step))).sort((a,b)=>a-b);
+          const nearest = steps.reduce((best, s) => Math.abs(s - sx) < Math.abs(best - sx) ? s : best, steps[0]);
+          const xpx = xScale(nearest);
+          hoverLine.style('display', null).attr('x1', xpx).attr('x2', xpx);
+          // tooltip content (styled)
+          let html = `<div style=\"font-weight:800;letter-spacing:.1px;\">${metricKey}</div><div style=\"font-size:11px;color:var(--muted-color);margin-top:-4px;margin-bottom:2px;\">Step ${formatK(nearest)}</div>`;
+          const entries = series.map(s => {
+            const m = new Map(s.values.map(v=>[v.step, v.value]));
+            const val = m.get(nearest);
+            return { run: s.run, color: s.color, val };
+          }).filter(e => e.val != null);
+          entries.sort((a, b) => a.val - b.val);
+          entries.forEach(e => {
+            html += `<div style=\"display:flex;align-items:center;gap:6px;white-space:nowrap;\"><span class=\"d3-tooltip__color-dot\" style=\"background:${e.color}\"></span><strong>${e.run}</strong><span style=\"margin-left:auto;\">${(+e.val).toFixed(4)}</span></div>`;
+          });
+          tipInner.innerHTML = html; tip.style.opacity = '1'; tip.style.transform = `translate(${Math.round(mx + margin.left + 12)}px, ${Math.round(my + margin.top + 12)}px)`;
+        }
+        function onLeave(){ tip.style.opacity='0'; tip.style.transform='translate(-9999px, -9999px)'; hoverLine.style('display','none'); }
+        overlay.on('mousemove', onMove).on('mouseleave', onLeave);
+      }
+
+      // load CSV and init
+      (async () => {
+        try {
+          const text = await fetchFirstAvailable(CSV_PATHS);
+          const rows = d3.csvParse(text, d => ({
+            run:(d.run||'').trim(),
+            step:+d.step,
+            metric:(d.metric||'').trim(),
+            value:+d.value,
+            // Optional bounds: stderr or [min,max] or [lower,upper]
+            stderr: (d.stderr!=null && d.stderr!=='') ? +d.stderr : null,
+            min: (d.min!=null && d.min!=='') ? +d.min : (d.lower!=null && d.lower!=='') ? +d.lower : null,
+            max: (d.max!=null && d.max!=='') ? +d.max : (d.upper!=null && d.upper!=='') ? +d.upper : null
+          }));
+          const metrics = Array.from(new Set(rows.map(r=>r.metric))).sort();
+          runOrder = Array.from(new Set(rows.map(r=>r.run))).sort();
+          metrics.forEach(m => {
+            const map = {}; runOrder.forEach(r => map[r] = []);
+            rows.filter(r=>r.metric===m).forEach(r => {
+              if (!isNaN(r.step) && !isNaN(r.value)) map[r.run].push({ step:r.step, value:r.value, stderr: r.stderr, min: r.min, max: r.max });
+            });
+            dataByMetric.set(m, map);
+          });
+          // populate metric select (pretty labels) or hide if single-file with single metric
+          const isSingleFile = !Array.isArray(providedData) && typeof providedData === 'string';
+          metrics.forEach(m => { const o = document.createElement('option'); o.value=m; o.textContent=prettyMetricLabel(m); selectMetric.appendChild(o); });
+          // default metric selection via config.defaultMetric (match raw key or pretty label, case-insensitive)
+          if (metrics.length) {
+            let initial = metrics[0];
+            const desired = providedConfig && typeof providedConfig === 'object' && providedConfig.defaultMetric ? String(providedConfig.defaultMetric) : null;
+            if (desired) {
+              const lcDesired = desired.toLowerCase();
+              const byKey = metrics.find(m => m.toLowerCase() === lcDesired);
+              const byPretty = metrics.find(m => prettyMetricLabel(m).toLowerCase() === lcDesired);
+              initial = byKey || byPretty || initial;
+            }
+            selectMetric.value = initial;
+          }
+          if (isSingleFile && metrics.length <= 1) {
+            controls.style.display = 'none';
+          }
+
+          render(selectMetric.value);
+          selectMetric.addEventListener('change', () => render(selectMetric.value));
+          const rerender = () => render(selectMetric.value);
+          if (window.ResizeObserver) { const ro = new ResizeObserver(() => rerender()); ro.observe(container); } else { window.addEventListener('resize', rerender); }
+        } catch (e) {
+          const pre = document.createElement('pre'); pre.textContent = 'CSV load error: ' + (e && e.message ? e.message : e);
+          pre.style.color = 'var(--danger, #b00020)'; pre.style.fontSize = '12px'; pre.style.whiteSpace = 'pre-wrap'; container.appendChild(pre);
+        }
+      })();
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
+
+
diff --git a/app/src/content/embeds/d3-matrix.html b/app/src/content/embeds/d3-matrix.html
new file mode 100644
index 0000000000000000000000000000000000000000..c72ef203e5c43f0c878463d2d6b2e2da382db2cf
--- /dev/null
+++ b/app/src/content/embeds/d3-matrix.html
@@ -0,0 +1,515 @@
+<div class="d3-matrix"  ></div>
+<style>
+  .d3-matrix {
+    position: relative;
+  }
+  .d3-matrix .panels {
+    display: flex;
+    flex-wrap: wrap;
+    gap: 16px;
+    margin-bottom: 4px;
+  }
+  .d3-matrix .panel {
+    flex: 1 1 320px;
+    min-width: 280px;
+  }
+  .d3-matrix .panel__title {
+    color: var(--text-color);
+    font-size: 12px;
+    line-height: 1.35;
+    margin: 0 0 6px 0;
+    font-weight: 600;
+  }
+  .d3-matrix .axis-label {
+    fill: var(--text-color);
+    font-size: 11px;
+    font-weight: 700;
+  }
+  .d3-matrix .cell-border {
+    stroke: var(--border-color);
+    stroke-width: 1px;
+    fill: none;
+  }
+  .d3-matrix .cell-text {
+    fill: var(--muted-color);
+    font-size: 11px;
+    pointer-events: none;
+  }
+  .d3-matrix .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+</style>
+<script>
+  (() => {
+    // Load D3 from CDN once
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) {
+        s = document.createElement('script');
+        s.id = 'd3-cdn-script';
+        s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js';
+        document.head.appendChild(s);
+      }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-matrix'))){
+        const cs = Array.from(document.querySelectorAll('.d3-matrix')).filter(el => !(el.dataset && el.dataset.mounted === 'true'));
+        container = cs[cs.length - 1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) {
+        if (container.dataset.mounted === 'true') return;
+        container.dataset.mounted = 'true';
+      }
+
+      // Tooltip (HTML, single instance inside container)
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip');
+      let tipInner;
+      if (!tip) {
+        tip = document.createElement('div');
+        tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position: 'absolute',
+          top: '0px',
+          left: '0px',
+          transform: 'translate(-9999px, -9999px)',
+          pointerEvents: 'none',
+          padding: '8px 10px',
+          borderRadius: '8px',
+          fontSize: '12px',
+          lineHeight: '1.35',
+          border: '1px solid var(--border-color)',
+          background: 'var(--surface-bg)',
+          color: 'var(--text-color)',
+          boxShadow: '0 4px 24px rgba(0,0,0,.18)',
+          opacity: '0',
+          transition: 'opacity .12s ease'
+        });
+        tipInner = document.createElement('div');
+        tipInner.className = 'd3-tooltip__inner';
+        tipInner.style.textAlign = 'left';
+        tip.appendChild(tipInner);
+        container.appendChild(tip);
+      } else {
+        tipInner = tip.querySelector('.d3-tooltip__inner') || tip;
+      }
+
+      // Panels container (two side-by-side matrices)
+      const panels = document.createElement('div');
+      panels.className = 'panels';
+      const panelA = document.createElement('div');
+      panelA.className = 'panel';
+      const titleA = document.createElement('div'); titleA.className = 'panel__title'; titleA.textContent = 'Baseline (row-normalized %)';
+      panelA.appendChild(titleA);
+      const mountA = document.createElement('div'); panelA.appendChild(mountA);
+      const panelB = document.createElement('div');
+      panelB.className = 'panel';
+      const titleB = document.createElement('div'); titleB.className = 'panel__title'; titleB.textContent = 'Delta (Improved − Baseline, pp)';
+      panelB.appendChild(titleB);
+      const mountB = document.createElement('div'); panelB.appendChild(mountB);
+      panels.appendChild(panelA);
+      panels.appendChild(panelB);
+      container.appendChild(panels);
+
+      // SVG scaffolding
+      const cardA = document.createElement('div'); cardA.className = 'chart-card'; mountA.appendChild(cardA);
+      const svgA = d3.select(cardA).append('svg').attr('width', '100%').style('display', 'block');
+      const gRootA = svgA.append('g');
+      const gCellsA = gRootA.append('g');
+      const gAxesA = gRootA.append('g');
+      const cardB = document.createElement('div'); cardB.className = 'chart-card'; mountB.appendChild(cardB);
+      const svgB = d3.select(cardB).append('svg').attr('width', '100%').style('display', 'block');
+      const gRootB = svgB.append('g');
+      const gCellsB = gRootB.append('g');
+      const gAxesB = gRootB.append('g');
+
+      // Demo data (two distinct 10x10 matrices: Baseline vs Improved)
+      // Rows / Columns are generic class labels
+      const classes = ['0','1','2','3','4','5','6','7','8','9'];
+      const matrixA = [
+        [90,  2,  1,  0,  0,  0,  1,  0,  5,  1],
+        [ 3, 85,  5,  1,  0,  1,  2,  1,  1,  1],
+        [ 1,  6, 70, 10,  4,  4,  1,  1,  1,  2],
+        [ 0,  1,  8, 65, 10, 10,  2,  1,  1,  2],
+        [ 0,  0,  2,  6, 83,  3,  1,  1,  3,  1],
+        [ 0,  1,  2, 12,  4, 70,  5,  2,  2,  2],
+        [ 1,  2,  1,  0,  1,  2, 88,  1,  3,  1],
+        [ 0,  1,  1,  1,  1,  1,  2, 90,  1,  2],
+        [ 6,  2,  2,  4,  6,  3,  3,  2, 70,  2],
+        [ 1,  1,  1,  1,  2,  1,  1,  2,  1, 89]
+      ];
+      const matrixB = [
+        [94,  1,  0,  0,  0,  0,  1,  0,  3,  1],
+        [ 2, 90,  3,  1,  0,  0,  1,  1,  1,  1],
+        [ 1,  4, 78,  7,  3,  3,  1,  1,  1,  1],
+        [ 0,  1,  5, 74,  7,  8,  1,  1,  1,  2],
+        [ 0,  0,  1,  4, 88,  2,  1,  1,  2,  1],
+        [ 0,  1,  1,  9,  3, 78,  3,  1,  2,  2],
+        [ 1,  1,  1,  0,  1,  1, 91,  1,  2,  1],
+        [ 0,  1,  1,  1,  1,  1,  1, 92,  1,  1],
+        [ 4,  1,  1,  3,  4,  2,  2,  2, 79,  2],
+        [ 1,  1,  1,  1,  2,  1,  1,  1,  1, 90]
+      ];
+
+      // Colors: sequential palette via window.ColorPalettes with graceful fallback
+      const getSequentialColors = (count) => {
+        try {
+          if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+            return window.ColorPalettes.getColors('sequential', count);
+          }
+        } catch (_) {}
+        // Fallback: generate a monochrome scale using the primary color with varying opacity
+        const arr = [];
+        for (let i = 0; i < count; i++) arr.push('var(--primary-color)');
+        return arr;
+      };
+
+      const palette = getSequentialColors(13);
+      const getDivergingColors = (count) => {
+        try {
+          if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+            return window.ColorPalettes.getColors('diverging', count);
+          }
+        } catch (_) {}
+        const steps = Math.max(3, count|0);
+        const arr = [];
+        for (let i = 0; i < steps; i++) {
+          const t = i / (steps - 1);
+          const pct = Math.round(t * 100);
+          arr.push(`color-mix(in srgb, #D64545 ${100-pct}%, #3A7BD5 ${pct}%)`);
+        }
+        return arr;
+      };
+
+      let width = 800;
+      let height = 480;
+      const margin = { top: 36, right: 24, bottom: 26, left: 56 };
+
+      function updateSize() {
+        const isDark = document.documentElement.getAttribute('data-theme') === 'dark';
+        width = container.clientWidth || 800;
+        const gap = 16; // matches CSS .panels gap
+        const minPanel = 320;
+        const nCols = (width >= (minPanel * 2 + gap)) ? 2 : 1;
+        const panelWidth = nCols === 2 ? Math.max(minPanel, Math.floor((width - gap) / 2)) : Math.max(minPanel, width);
+        const base = Math.max(minPanel, Math.round(panelWidth * 0.92));
+        height = base;
+        // Responsive SVG: width 100%, height auto, preserve aspect via viewBox
+        svgA
+          .attr('viewBox', `0 0 ${panelWidth} ${height}`)
+          .attr('preserveAspectRatio', 'xMidYMid meet')
+          .style('width', '100%')
+          .style('height', 'auto');
+        svgB
+          .attr('viewBox', `0 0 ${panelWidth} ${height}`)
+          .attr('preserveAspectRatio', 'xMidYMid meet')
+          .style('width', '100%')
+          .style('height', 'auto');
+        gRootA.attr('transform', `translate(${margin.left},${margin.top})`);
+        gRootB.attr('transform', `translate(${margin.left},${margin.top})`);
+        const innerWidth = panelWidth - margin.left - margin.right;
+        const innerHeight = height - margin.top - margin.bottom;
+        return { innerWidth, innerHeight, isDark };
+      }
+
+      function computeValues(normalization, matrix) {
+        const n = classes.length;
+        const totalsByRow = matrix.map(row => row.reduce((a, b) => a + b, 0));
+        const flat = [];
+        let minV = Infinity, maxV = -Infinity;
+        for (let r = 0; r < n; r++) {
+          for (let c = 0; c < n; c++) {
+            const count = matrix[r][c];
+            const value = normalization === 'row' ? (totalsByRow[r] ? count / totalsByRow[r] : 0) : count;
+            if (value < minV) minV = value;
+            if (value > maxV) maxV = value;
+            flat.push({ r, c, count, value });
+          }
+        }
+        return { data: flat, minV, maxV };
+      }
+
+      function getColorScale(values, minV, maxV) {
+        // If ColorPalettes is available, use quantiles to enhance visual variation across the distribution
+        const hasPalette = !(palette.length === 0);
+        if (hasPalette && (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function')) {
+          const scale = d3.scaleQuantile().domain(values).range(palette);
+          return (v) => scale(v);
+        }
+        // Fallback: primary color with opacity mapped to normalized value
+        const norm = d3.scaleLinear().domain([minV, maxV]).range([0.08, 0.9]).clamp(true);
+        return (v) => `color-mix(in oklab, var(--primary-color) ${Math.round(norm(v) * 100)}%, var(--surface-bg))`;
+      }
+
+      // Compute a fixed readable text color from a CSS rgb()/rgba() string
+      function chooseFixedReadableTextOnBg(bgCss){
+        try {
+          const m = String(bgCss||'').match(/rgba?\(([^)]+)\)/);
+          if (!m) return '#0e1116';
+          const parts = m[1].split(',').map(s => parseFloat(s.trim()));
+          const [r, g, b] = parts;
+          // sRGB → relative luminance
+          const srgb = [r, g, b].map(v => Math.max(0, Math.min(255, v)) / 255);
+          const linear = srgb.map(c => (c <= 0.03928 ? c/12.92 : Math.pow((c + 0.055)/1.055, 2.4)));
+          const L = 0.2126*linear[0] + 0.7152*linear[1] + 0.0722*linear[2];
+          // Threshold ~ 0.5 for readability; darker BG → white text, else near-black
+          return L < 0.5 ? '#ffffff' : '#0e1116';
+        } catch(_) { return '#0e1116'; }
+      }
+
+      function render() {
+        const { innerWidth, innerHeight } = updateSize();
+        const n = classes.length;
+        const gridSize = Math.min(innerWidth, innerHeight);
+        const cellSize = gridSize / n;
+
+        const x = d3.scaleBand().domain(d3.range(n)).range([0, gridSize]).paddingInner(0.06);
+        const y = d3.scaleBand().domain(d3.range(n)).range([0, gridSize]).paddingInner(0.06);
+
+        // Panel A: Baseline (row-normalized)
+        const dataA = computeValues('row', matrixA);
+        const colorA = getColorScale(dataA.data.map(d => d.value), dataA.minV, dataA.maxV);
+
+        gCellsA.selectAll('rect.cell-bg')
+          .data([0])
+          .join('rect')
+          .attr('class', 'cell-bg')
+          .attr('x', 0)
+          .attr('y', 0)
+          .attr('width', gridSize)
+          .attr('height', gridSize)
+          .attr('fill', 'none')
+          .attr('stroke', 'var(--border-color)')
+          .attr('stroke-width', 1);
+
+        const cellsA = gCellsA.selectAll('g.cell')
+          .data(dataA.data, d => `${d.r}-${d.c}-A`);
+
+        const cellsEnterA = cellsA.enter()
+          .append('g')
+          .attr('class', 'cell');
+
+        cellsEnterA.append('rect')
+          .attr('rx', 2)
+          .attr('ry', 2)
+          .on('mousemove', (event, d) => {
+            const [px, py] = d3.pointer(event, container);
+            tipInner.innerHTML = `<strong>${classes[d.r]}</strong> → <strong>${classes[d.c]}</strong><br/>${(d.value * 100).toFixed(1)}% (${d.count})`;
+            tip.style.transform = `translate(${px + 10}px, ${py + 10}px)`;
+            tip.style.opacity = '1';
+          })
+          .on('mouseleave', () => {
+            tip.style.opacity = '0';
+          });
+
+        cellsEnterA.append('text')
+          .attr('class', 'cell-text')
+          .attr('text-anchor', 'middle')
+          .attr('dominant-baseline', 'middle');
+
+        const cellsMergedA = cellsEnterA.merge(cellsA);
+
+        cellsMergedA.select('text')
+          .attr('x', d => x(d.c) + x.bandwidth() / 2)
+          .attr('y', d => y(d.r) + y.bandwidth() / 2)
+          .text(d => `${Math.round(d.value * 100)}`)
+          .style('fill', function(d){
+            try {
+              const rect = this && this.parentNode ? this.parentNode.querySelector('rect') : null;
+              const bg = rect ? getComputedStyle(rect).fill : colorA(d.value);
+              return chooseFixedReadableTextOnBg(bg);
+            } catch (_) {
+              return '#0e1116';
+            }
+          });
+
+        cellsMergedA.select('rect')
+          .attr('x', d => x(d.c))
+          .attr('y', d => y(d.r))
+          .attr('width', Math.max(1, x.bandwidth()))
+          .attr('height', Math.max(1, y.bandwidth()))
+          .attr('fill', d => colorA(d.value));
+
+        cellsA.exit().remove();
+
+        gAxesA.selectAll('*').remove();
+
+        gAxesA.append('g')
+          .selectAll('text')
+          .data(classes)
+          .join('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('x', (_, i) => x(i) + x.bandwidth() / 2)
+          .attr('y', -8)
+          .text(d => d);
+
+        gAxesA.append('g')
+          .selectAll('text')
+          .data(classes)
+          .join('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'end')
+          .attr('x', -8)
+          .attr('y', (_, i) => y(i) + y.bandwidth() / 2)
+          .attr('dominant-baseline', 'middle')
+          .text(d => d);
+
+        gAxesA.append('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('x', gridSize / 2)
+          .attr('y', innerHeight + 20)
+          .text('Columns');
+
+        gAxesA.append('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('transform', `translate(${-40}, ${gridSize / 2}) rotate(-90)`)
+          .text('Rows');
+
+        // Panel B: Delta (Improved − Baseline), row-normalized differences in percentage points
+        const dataB = computeValues('row', matrixB);
+        const diverging = getDivergingColors(13);
+        // Build delta values aligned to A's ordering
+        const mapA = new Map(dataA.data.map(d => [d.r + '-' + d.c, d.value]));
+        const delta = dataB.data.map(d => ({ r: d.r, c: d.c, count: d.count, value: (d.value - (mapA.get(d.r + '-' + d.c) || 0)) }));
+        // Symmetric domain around 0 (in proportions), express later as pp in labels
+        const maxAbsDelta = Math.max(0.01, d3.max(delta, d => Math.abs(d.value)) || 0.01);
+        const colorB = d3.scaleQuantize().domain([-maxAbsDelta, maxAbsDelta]).range(diverging);
+
+        gCellsB.selectAll('rect.cell-bg')
+          .data([0])
+          .join('rect')
+          .attr('class', 'cell-bg')
+          .attr('x', 0)
+          .attr('y', 0)
+          .attr('width', gridSize)
+          .attr('height', gridSize)
+          .attr('fill', 'none')
+          .attr('stroke', 'var(--border-color)')
+          .attr('stroke-width', 1);
+
+        const cellsB = gCellsB.selectAll('g.cell')
+          .data(dataB.data, d => `${d.r}-${d.c}-B`);
+
+        const cellsEnterB = cellsB.enter()
+          .append('g')
+          .attr('class', 'cell');
+
+        cellsEnterB.append('rect')
+          .attr('rx', 2)
+          .attr('ry', 2)
+          .on('mousemove', (event, d) => {
+            const [px, py] = d3.pointer(event, container);
+            const a = dataA.data.find(x => x.r===d.r && x.c===d.c);
+            const b = dataB.data.find(x => x.r===d.r && x.c===d.c);
+            const dv = ((b ? b.value : 0) - (a ? a.value : 0)) * 100;
+            tipInner.innerHTML = `<strong>${classes[d.r]}</strong> → <strong>${classes[d.c]}</strong>` +
+              `<br/>baseline ${(a ? a.value*100 : 0).toFixed(1)}%` +
+              `<br/>improved ${(b ? b.value*100 : 0).toFixed(1)}%` +
+              `<br/>delta ${dv.toFixed(1)} pp`;
+            tip.style.transform = `translate(${px + 10}px, ${py + 10}px)`;
+            tip.style.opacity = '1';
+          })
+          .on('mouseleave', () => {
+            tip.style.opacity = '0';
+          });
+
+        cellsEnterB.append('text')
+          .attr('class', 'cell-text')
+          .attr('text-anchor', 'middle')
+          .attr('dominant-baseline', 'middle');
+
+        const cellsMergedB = cellsEnterB.merge(cellsB);
+
+        cellsMergedB.select('rect')
+          .attr('x', d => x(d.c))
+          .attr('y', d => y(d.r))
+          .attr('width', Math.max(1, x.bandwidth()))
+          .attr('height', Math.max(1, y.bandwidth()))
+          .attr('fill', d => colorB(delta.find(x => x.r===d.r && x.c===d.c).value));
+
+        cellsMergedB.select('text')
+          .attr('x', d => x(d.c) + x.bandwidth() / 2)
+          .attr('y', d => y(d.r) + y.bandwidth() / 2)
+          .text(d => {
+            const dv = delta.find(x => x.r===d.r && x.c===d.c).value; return `${Math.round(dv * 100)}`;
+          })
+          .style('fill', function(d){
+            try {
+              const rect = this && this.parentNode ? this.parentNode.querySelector('rect') : null;
+              const dv = delta.find(x => x.r===d.r && x.c===d.c).value;
+              const bg = rect ? getComputedStyle(rect).fill : colorB(dv);
+              return chooseFixedReadableTextOnBg(bg);
+            } catch (_) {
+              return '#0e1116';
+            }
+          });
+
+        cellsB.exit().remove();
+
+        gAxesB.selectAll('*').remove();
+
+        gAxesB.append('g')
+          .selectAll('text')
+          .data(classes)
+          .join('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('x', (_, i) => x(i) + x.bandwidth() / 2)
+          .attr('y', -8)
+          .text(d => d);
+
+        gAxesB.append('g')
+          .selectAll('text')
+          .data(classes)
+          .join('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'end')
+          .attr('x', -8)
+          .attr('y', (_, i) => y(i) + y.bandwidth() / 2)
+          .attr('dominant-baseline', 'middle')
+          .text(d => d);
+
+        gAxesB.append('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('x', gridSize / 2)
+          .attr('y', innerHeight + 20)
+          .text('Columns');
+
+        gAxesB.append('text')
+          .attr('class', 'axis-label')
+          .attr('text-anchor', 'middle')
+          .attr('transform', `translate(${-40}, ${gridSize / 2}) rotate(-90)`)
+          .text('Rows');
+      }
+
+      // Initial render + resize handling
+      render();
+      const rerender = () => render();
+      if (window.ResizeObserver) {
+        const ro = new ResizeObserver(() => rerender());
+        ro.observe(container);
+      } else {
+        window.addEventListener('resize', rerender);
+      }
+    };
+
+    if (document.readyState === 'loading') {
+      document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true });
+    } else {
+      ensureD3(bootstrap);
+    }
+  })();
+</script>
+
+
+
diff --git a/app/src/content/embeds/d3-neural-network.html b/app/src/content/embeds/d3-neural-network.html
new file mode 100644
index 0000000000000000000000000000000000000000..c64f407c4432b2fe6c75590f18e6110ba9a11797
--- /dev/null
+++ b/app/src/content/embeds/d3-neural-network.html
@@ -0,0 +1,758 @@
+<div class="d3-neural"></div>
+<style>
+  .d3-neural { position: relative; width:100%;margin:0;}
+  .d3-neural .controls { margin-top: 12px; display: flex; gap: 12px; align-items: center; flex-wrap: wrap; }
+  .d3-neural .controls label { font-size: 12px; color: var(--muted-color); display: flex; align-items: center; gap: 8px; white-space: nowrap; padding: 6px 10px; }
+  .d3-neural .controls input[type="range"]{ width: 160px; }
+  .d3-neural .panel { display:flex; gap:8px; align-items:stretch; flex-wrap: nowrap; }
+  .d3-neural .left { flex: 0 0 33.333%; max-width: 33.333%; min-width: 160px; display:flex; flex-direction:column; gap:8px; }
+  .d3-neural .right { flex: 1 1 66.666%; max-width: 66.666%; min-width: 280px; display:flex; }
+  .d3-neural .right > svg { flex: 1 1 auto; height: 100%; }
+  .d3-neural .arrow-sep { flex: 0 0 18px; max-width: 18px; display:flex; align-items:center; justify-content:center; color: var(--muted-color); }
+  .d3-neural .arrow-sep svg { display:block; width: 16px; height: 16px; }
+  @media (max-width: 800px) {
+    .d3-neural .panel { flex-direction: column; }
+    .d3-neural .left,
+    .d3-neural .right { flex: 0 0 100%; max-width: 100%; min-width: 0; }
+    .d3-neural .arrow-sep { display: none; }
+  }
+  .d3-neural canvas { width: 100%; height: auto; border-radius: 8px; border: 1px solid var(--border-color); background: var(--surface-bg); display:block; }
+  .d3-neural .preview28 { display:grid; grid-template-columns: repeat(28, 1fr); gap: 1px; width: 100%; }
+  .d3-neural .preview28 span { display:block; aspect-ratio:1/1; border-radius:2px; }
+  .d3-neural .legend { font-size: 12px; color: var(--text-color); line-height:1.35; }
+  .d3-neural .probs { display:flex; gap:6px; align-items:flex-end; height: 64px; }
+  .d3-neural .probs .bar { width: 10px; border-radius:2px 2px 0 0; background: var(--border-color); transition: height .15s ease, background-color .15s ease; }
+  .d3-neural .probs .bar.active { background: var(--primary-color); }
+  .d3-neural .probs .tick { font-size: 10px; color: var(--muted-color); text-align:center; margin-top: 2px; }
+  .d3-neural .canvas-wrap { position: relative; }
+  .d3-neural .erase-btn { position: absolute; top: 8px; right: 8px; width: 32px; height: 32px; display:flex; align-items:center; justify-content:center; border: 1px solid var(--border-color);  }
+  .d3-neural .canvas-hint { position: absolute; top: 8px; left: 12px; font-size: 12px; font-weight: 700; color: rgba(0,0,0,.9); pointer-events: none; transition: opacity .12s ease; }
+  
+</style>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.d3) onReady();
+    };
+
+    const ensureTF = (cb) => {
+      if (window.tf && typeof window.tf.tensor === 'function') return cb();
+      let s = document.getElementById('tfjs-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'tfjs-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/@tensorflow/tfjs@4.20.0/dist/tf.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.tf && typeof window.tf.tensor === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.tf) onReady();
+    };
+
+    const bootstrap = () => {
+      const mount = document.currentScript ? document.currentScript.previousElementSibling : null;
+      const container = (mount && mount.querySelector && mount.querySelector('.d3-neural')) || document.querySelector('.d3-neural');
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted === 'true') return; container.dataset.mounted = 'true'; }
+
+      // (tooltip removed)
+
+      // Layout: left (canvas + preview + controls), right (svg network)
+      const panel = document.createElement('div');
+      panel.className = 'panel';
+      const left = document.createElement('div'); left.className = 'left';
+      const arrowSep = document.createElement('div'); arrowSep.className = 'arrow-sep';
+      arrowSep.innerHTML = '<svg viewBox="0 0 24 24" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><line x1="3" y1="12" x2="19" y2="12" stroke="currentColor" stroke-width="2" stroke-linecap="round"/><polyline points="17,7 22,12 17,17" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"/></svg>';
+      const right = document.createElement('div'); right.className = 'right';
+      panel.appendChild(left); panel.appendChild(arrowSep); panel.appendChild(right);
+      container.appendChild(panel);
+
+      // Canvas for drawing
+      const CANVAS_PX = 224; // canvas pixels (square)
+      const canvas = document.createElement('canvas'); canvas.width = CANVAS_PX; canvas.height = CANVAS_PX;
+      const ctx = canvas.getContext('2d');
+      // init white bg
+      ctx.fillStyle = '#ffffff'; ctx.fillRect(0,0,CANVAS_PX,CANVAS_PX);
+      const canvasWrap = document.createElement('div'); canvasWrap.className = 'canvas-wrap';
+      canvasWrap.appendChild(canvas);
+      // Erase icon button (top-right)
+      const eraseBtn = document.createElement('button'); eraseBtn.className='erase-btn button--ghost'; eraseBtn.type='button'; eraseBtn.setAttribute('aria-label','Clear');
+      // Hidden until the user interacts with the canvas
+      eraseBtn.style.display = 'none';
+      eraseBtn.innerHTML = '<svg width="16" height="16" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"><polyline points="3 6 5 6 21 6"></polyline><path d="M19 6l-1 14a2 2 0 0 1-2 2H8a2 2 0 0 1-2-2L5 6"></path><path d="M10 11v6"></path><path d="M14 11v6"></path><path d="M9 6V4a2 2 0 0 1 2-2h2a2 2 0 0 1 2 2v2"></path></svg>';
+      eraseBtn.addEventListener('click', () => clearCanvas());
+      canvasWrap.appendChild(eraseBtn);
+      // Hint (top-left)
+      const hint = document.createElement('div'); hint.className='canvas-hint'; hint.textContent='Draw a digit here';
+      canvasWrap.appendChild(hint);
+      left.appendChild(canvasWrap);
+
+      // (preview grid removed)
+
+      // (controls removed; erase button is overlayed on canvas)
+
+      // (prediction panel removed; predictions rendered next to output nodes)
+
+      // SVG network on right
+      const svg = d3.select(right).append('svg').attr('width','100%').style('display','block');
+      const defs = svg.append('defs');
+      const gRoot = svg.append('g');
+      const gInput = gRoot.append('g').attr('class','input');
+      const gInputLinks = gRoot.append('g').attr('class','input-links');
+      const gLinks = gRoot.append('g').attr('class','links');
+      const gNodes = gRoot.append('g').attr('class','nodes');
+      const gLabels = gRoot.append('g').attr('class','labels');
+      const gOutText = gRoot.append('g').attr('class','out-probs');
+
+      // Network structure (compact: 8 -> 8 -> 10)
+      const layerSizes = [8, 8, 10];
+      const layers = layerSizes.map((n, li)=> Array.from({length:n}, (_, i)=>({ id:`L${li}N${i}`, layer: li, index: i, a:0 })));
+      // Links only between hidden->hidden and hidden->output
+      const links = [];
+      for (let i=0;i<layerSizes[0];i++){
+        for (let j=0;j<layerSizes[1];j++) links.push({ s:{l:0,i}, t:{l:1,j}, w: (Math.sin(i*17+j*31)+1)/2 });
+      }
+      for (let i=0;i<layerSizes[1];i++){
+        for (let j=0;j<layerSizes[2];j++) links.push({ s:{l:1,i}, t:{l:2,j}, w: (Math.cos(i*7+j*13)+1)/2 });
+      }
+
+      // Linear classifier: logits = W * feats + b, feats in [0,1]
+      // features: [total, cx, cy, lr, tb, htrans, vtrans, loopiness]
+      const W = [
+        // 0  1    2    3    4    5      6      7
+        [ 0.3, 0.0, 0.0, 0.0, 0.0, -0.8, -0.6,  1.2], // 0
+        [-0.2, 0.9, 0.2, 0.8, 0.1, -0.2,  0.2, -1.1], // 1
+        [ 0.1, 0.4, 0.2, 0.5, 0.2,  0.9,  0.1, -0.6], // 2
+        [ 0.2, 0.3, 0.2, 0.2, 0.2,  0.9,  0.0, -0.2], // 3
+        [ 0.0,-0.3, 0.2,-0.6, 0.4,  0.2,  0.8, -0.6], // 4
+        [ 0.1,-0.4, 0.2,-0.5, 0.5,  0.9,  0.1, -0.6], // 5
+        [ 0.2,-0.2, 0.6,-0.2, 0.8, -0.3,  0.2,  0.6], // 6
+        [ 0.0, 0.6,-0.2, 0.6,-0.8,  0.6,  0.0, -0.8], // 7
+        [ 0.4, 0.0, 0.0, 0.1, 0.1,  0.6,  0.6,  1.0], // 8
+        [ 0.2, 0.2,-0.6, 0.2,-0.8,  0.2,  0.6,  0.5], // 9
+      ];
+      const b = [-0.2, -0.1, -0.05, -0.05, -0.05, -0.05, -0.05, -0.1, -0.15, -0.1];
+
+      function computeFeatures(x28){
+        // x28: Float32Array length 784, values in [0,1] (1 = black/ink)
+        let sum=0, cx=0, cy=0; const w=28, h=28;
+        const rowSum = new Array(h).fill(0); const colSum = new Array(w).fill(0);
+        let hTransitions=0, vTransitions=0;
+        for (let y=0;y<h;y++){
+          for (let x=0;x<w;x++){
+            const v = x28[y*w+x]; sum += v; cx += x*v; cy += y*v; rowSum[y]+=v; colSum[x]+=v;
+            if (x>0){ const v0=x28[y*w+(x-1)], v1=v; if ((v0>0.25)!==(v1>0.25)) hTransitions+=1; }
+            if (y>0){ const v0=x28[(y-1)*w+x], v1=v; if ((v0>0.25)!==(v1>0.25)) vTransitions+=1; }
+          }
+        }
+        const total = sum/(w*h); // [0,1]
+        const cxn = sum>1e-6 ? (cx/sum)/(w-1) : 0.5; // [0,1]
+        const cyn = sum>1e-6 ? (cy/sum)/(h-1) : 0.5; // [0,1]
+        let left=0,right=0,top=0,bottom=0;
+        for (let y=0;y<h;y++){ for (let x=0;x<w;x++){ const v=x28[y*w+x]; if (x<w/2) left+=v; else right+=v; if (y<h/2) top+=v; else bottom+=v; }}
+        const lr = (right/(right+left+1e-6));
+        const tb = (bottom/(bottom+top+1e-6));
+        const htn = Math.min(1, hTransitions/(w*h*0.35));
+        const vtn = Math.min(1, vTransitions/(w*h*0.35));
+        // Loopiness proxy: ink near perimeter low vs center high
+        let perimeter=0, center=0; const m=5;
+        for (let y=0;y<h;y++){
+          for (let x=0;x<w;x++){
+            const v=x28[y*w+x];
+            const isBorder = (x<m||x>=w-m||y<m||y>=h-m);
+            if (isBorder) perimeter+=v; else center+=v;
+          }
+        }
+        const loopiness = Math.min(1, center/(perimeter+center+1e-6)*1.8);
+        return [total, cxn, cyn, lr, tb, htn, vtn, loopiness];
+      }
+
+      function softmax(arr){ const m=Math.max(...arr); const ex=arr.map(v=>Math.exp(v-m)); const s=ex.reduce((a,b)=>a+b,0)+1e-12; return ex.map(v=>v/s); }
+      function l2norm(a){ return Math.hypot(...a) || 0; }
+      function normalize(a){ const n=l2norm(a); return n>0 ? a.map(v=>v/n) : a.slice(); }
+      function cosine(a,b){ let s=0; for (let i=0;i<a.length;i++) s+=a[i]*b[i]; const na=l2norm(a), nb=l2norm(b)||1; return na>0 ? s/(na*nb) : 0; }
+
+      // MNIST-like normalization: crop to tight bbox, scale into 20x20, center in 28x28
+      function normalize28(x28){
+        const w=28,h=28, thr=0.2;
+        let minX=29,minY=29,maxX=-1,maxY=-1, sum=0, cx=0, cy=0;
+        for (let y=0;y<h;y++){
+          for (let x=0;x<w;x++){
+            const v = x28[y*w+x];
+            if (v>thr){ if (x<minX) minX=x; if (x>maxX) maxX=x; if (y<minY) minY=y; if (y>maxY) maxY=y; }
+            sum += v; cx += x*v; cy += y*v;
+          }
+        }
+        if (sum < 1e-3 || maxX<0){ return x28; }
+        const comX = cx/sum, comY = cy/sum;
+        const bw = Math.max(1, maxX-minX+1), bh = Math.max(1, maxY-minY+1);
+        const scale = 20/Math.max(bw, bh);
+        const out = new Float32Array(w*h);
+        // center of canvas
+        const cxOut = (w-1)/2, cyOut = (h-1)/2;
+        for (let y=0;y<h;y++){
+          for (let x=0;x<w;x++){
+            // map output pixel to source space around COM
+            const sx = (x - cxOut)/scale + comX;
+            const sy = (y - cyOut)/scale + comY;
+            out[y*w+x] = bilinearSample(x28, w, h, sx, sy);
+          }
+        }
+        return out;
+      }
+      function bilinearSample(img, w, h, x, y){
+        const x0 = Math.floor(x), y0 = Math.floor(y);
+        const x1 = x0+1, y1 = y0+1;
+        const tx = x - x0, ty = y - y0;
+        function at(ix,iy){ if (ix<0||iy<0||ix>=w||iy>=h) return 0; return img[iy*w+ix]; }
+        const v00 = at(x0,y0), v10 = at(x1,y0), v01 = at(x0,y1), v11 = at(x1,y1);
+        const a = v00*(1-tx)+v10*tx; const b = v01*(1-tx)+v11*tx; return a*(1-ty)+b*ty;
+      }
+      // Simple dilation (max-pooling 3x3) to thicken strokes
+      function dilate28(x){
+        const w=28,h=28; const out=new Float32Array(w*h);
+        for (let y=0;y<h;y++){
+          for (let x0=0;x0<w;x0++){
+            let m=0;
+            for (let dy=-1;dy<=1;dy++){
+              for (let dx=-1;dx<=1;dx++){
+                const xx=x0+dx, yy=y+dy; if (xx<0||yy<0||xx>=w||yy>=h) continue;
+                const v = x[yy*w+xx]; if (v>m) m=v;
+              }
+            }
+            out[y*w+x0]=m;
+          }
+        }
+        return out;
+      }
+
+      // Glyph-based 28x28 prototypes for digits 0-9 (normalized)
+      const protoGlyphs28 = [];
+      (function buildGlyphProtos(){
+        const off = document.createElement('canvas'); off.width = CANVAS_PX; off.height = CANVAS_PX;
+        const c = off.getContext('2d');
+        for (let d=0; d<10; d++){
+          c.fillStyle = '#ffffff'; c.fillRect(0,0,off.width,off.height);
+          c.fillStyle = '#000000'; c.textAlign='center'; c.textBaseline='middle';
+          c.font = 'bold 180px system-ui, -apple-system, Segoe UI, Roboto, Arial, sans-serif';
+          c.fillText(String(d), off.width/2, off.height*0.56);
+          const src = c.getImageData(0,0,off.width,off.height).data; const block = off.width/28;
+          const vec = new Float32Array(28*28);
+          for (let gy=0; gy<28; gy++){
+            for (let gx=0; gx<28; gx++){
+              let acc=0, cnt=0; const x0=Math.floor(gx*block), y0=Math.floor(gy*block);
+              for (let yy=y0; yy<y0+block; yy++){
+                for (let xx=x0; xx<x0+block; xx++){
+                  const idx=(yy*off.width+xx)*4; const r=src[idx], g=src[idx+1], b=src[idx+2];
+                  const gray=(r+g+b)/3/255; acc += (1-gray); cnt++;
+                }
+              }
+              vec[gy*28+gx] = acc/(cnt||1);
+            }
+          }
+          const normed = normalize28(vec);
+          const n = l2norm(normed)||1; protoGlyphs28.push(normed.map(v=>v/n));
+        }
+      })();
+      function dot(a,b){ let s=0; for (let i=0;i<a.length;i++) s+=a[i]*b[i]; return s; }
+
+      // Resize handling and node layout
+      let width=640, height=360; const margin = { top: 16, right: 8, bottom: 24, left: 8 };
+      let inputGrid = { cell: 0, x: 0, y: 0, width: 0, height: 0 };
+      function layoutNodes(){
+        // Right panel width, and a non-square aspect ratio for clarity
+        width = Math.max(280, Math.round(right.clientWidth || 640));
+        height = Math.max(260, Math.round(width * 0.56));
+        svg.attr('width', width).attr('height', height);
+        // Match canvas height to SVG height so both columns align vertically
+        try { canvas.style.height = '100%'; canvasWrap.style.height = height + 'px'; } catch(_) {}
+        const innerW = width - margin.left - margin.right; const innerH = height - margin.top - margin.bottom;
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        // Input grid layout (28x28) at left — cap width to a fraction of innerW
+        const maxGridFrac = 0.28; // at most 28% of available width
+        const cellByHeight = Math.floor(innerH / 28);
+        const cellByWidth = Math.floor((innerW * maxGridFrac) / 28);
+        let cell = Math.max(3, Math.min(cellByHeight, cellByWidth));
+        let gridH = cell * 28; let gridY = Math.floor((innerH - gridH)/2);
+        inputGrid = { cell, x: 0, y: gridY, width: cell*28, height: gridH };
+        // Equal horizontal gaps: grid -> L0 -> L1 -> L2
+        const nLayers = layerSizes.length; // 3
+        const rightLabelPad = 36; // smaller pad; use more width for spreading layers
+        const minGap = 28; const maxGap = 260;
+        // Ensure enough free space; shrink grid if needed
+        const desiredMinFree = rightLabelPad + nLayers * minGap; // 3 equal gaps
+        if (inputGrid.width + desiredMinFree > innerW) {
+          cell = Math.max(3, Math.floor((innerW - desiredMinFree) / 28));
+          gridH = cell * 28; gridY = Math.floor((innerH - gridH)/2);
+          inputGrid = { cell, x: 0, y: gridY, width: cell*28, height: gridH };
+        }
+        const gridRight = inputGrid.x + inputGrid.width;
+        const freeW = Math.max(nLayers * minGap, innerW - gridRight - rightLabelPad);
+        const gapX = Math.min(maxGap, Math.max(minGap, Math.floor(freeW / nLayers)));
+        const xs = Array.from({ length: nLayers }, (_, li) => gridRight + gapX * (li + 1));
+        // Y positions evenly spaced per layer
+        layers.forEach((nodes, li)=>{
+          const n = nodes.length;
+          if (n <= 1) {
+            nodes.forEach((nd)=>{ nd.x = xs[li]; nd.y = innerH/2; });
+          } else {
+            const occupancy = 0.9; // use 90% of vertical space
+            const span = innerH * occupancy;
+            const topPad = (innerH - span) / 2;
+            const spacing = span / (n - 1);
+            nodes.forEach((nd, i)=>{ nd.x = xs[li]; nd.y = topPad + i*spacing; });
+          }
+        });
+      }
+
+      let lastX28 = new Float32Array(28*28);
+      function nodeRadiusForNode(n){
+        const a = Math.max(0, Math.min(1, (n && typeof n.a === 'number') ? n.a : 0));
+        if (n && n.layer === 2) {
+          // Output nodes: variable radius based on activation
+          return 8 + 10 * a; // ~8–18
+        }
+        // Hidden/feature nodes: variable radius based on activation
+        return 5 + 5 * a; // ~5–10
+      }
+      function renderInputGrid(){
+        if (!inputGrid || inputGrid.cell <= 0) return;
+        const data = Array.from({ length: 28*28 }, (_, i) => ({ i, v: lastX28[i] || 0 }));
+        const sel = gInput.selectAll('rect.input-px').data(data, d=>d.i);
+        const gap = Math.max(1, Math.floor(inputGrid.cell * 0.10));
+        const inner = Math.max(1, inputGrid.cell - gap);
+        const offset = Math.floor(gap / 2);
+        sel.enter().append('rect').attr('class','input-px')
+          .attr('width', inner).attr('height', inner)
+          .merge(sel)
+          .attr('x', d => inputGrid.x + (d.i % 28) * inputGrid.cell + offset)
+          .attr('y', d => inputGrid.y + Math.floor(d.i / 28) * inputGrid.cell + offset)
+          .attr('fill', d => {
+            // Increase perceived contrast of the input grid by applying a gamma curve
+            const k = Math.pow(Math.max(0, Math.min(1, d.v)), 0.6); // gamma < 1 → darker darks
+            const g = 255 - Math.round(k * 255);
+            return `rgb(${g},${g},${g})`;
+          })
+          .attr('stroke', 'none');
+        sel.exit().remove();
+
+        // Border around the input grid area
+        const borderSel = gInput.selectAll('rect.input-border').data([0]);
+        borderSel.enter().append('rect').attr('class','input-border')
+          .attr('fill','none')
+          .attr('rx', 0).attr('ry', 0)
+          .attr('stroke','var(--text-color)')
+          .attr('stroke-opacity', 0.25)
+          .attr('stroke-width', 1)
+          .lower()
+          .merge(borderSel)
+          .attr('x', inputGrid.x-1)
+          .attr('y', inputGrid.y-1)
+          .attr('width', inputGrid.width+1)
+          .attr('height', inputGrid.height+1);
+
+        // Centered label above the input grid
+        const labelSel = gInput.selectAll('text.input-label').data([0]);
+        labelSel.enter().append('text').attr('class','input-label')
+          .attr('text-anchor','middle')
+          .style('font-size','12px')
+          .style('font-weight','700')
+          .style('fill','var(--muted-color)')
+          .merge(labelSel)
+          .attr('x', inputGrid.x + inputGrid.width / 2)
+          .attr('y', Math.max(12, inputGrid.y - 10))
+          .text('Input 28×28');
+      }
+
+      // Compute link path between two layered nodes using their current radii
+      function computeLinkD(d){
+        const s = layers[d.s.l][d.s.i];
+        const t = layers[d.t.l][d.t.j];
+        if (!s || !t) return '';
+        const rs = nodeRadiusForNode(s);
+        const rt = nodeRadiusForNode(t);
+        // Use fixed anchors on circle edges for all inter-layer links (except grid->L0 handled elsewhere)
+        const x1 = s.x + rs, y1 = s.y;    // right edge of source circle
+        const x2 = t.x - rt, y2 = t.y;    // left edge of target circle
+        const dx = (x2 - x1) * 0.45;
+        return `M${x1},${y1} C${x1+dx},${y1} ${x2-dx},${y2} ${x2},${y2}`;
+      }
+
+      function renderInputLinks(){
+        // Draw bundle-like links from input grid right edge to first layer nodes (features)
+        const firstLayer = layers[0];
+        if (!firstLayer || !inputGrid || inputGrid.cell <= 0) { gInputLinks.selectAll('path').remove(); return; }
+        const x0 = inputGrid.x + inputGrid.width;
+        // Define a centered vertical band (half grid height) and distribute sources evenly
+        const k = firstLayer.length;
+        const band = inputGrid.height * 0.5;
+        const centerY = inputGrid.y + inputGrid.height / 2;
+        const yStart = centerY - band / 2;
+        const spacing = k > 1 ? band / (k - 1) : 0;
+        const paths = firstLayer.map((n, idx) => {
+          // source y from centered band, equidistant
+          const y0 = k > 1 ? (yStart + idx * spacing) : centerY;
+          // Target anchor: center of left edge of the node circle
+          const r = nodeRadiusForNode(n);
+          const x1 = n.x - r;
+          const y1 = n.y;
+          const dx = (x1 - x0) * 0.35;
+          return { x0, y0, x1, y1, c1x: x0 + dx, c1y: y0, c2x: x1 - dx, c2y: y1, idx };
+        });
+        const sel = gInputLinks.selectAll('path.input-link').data(paths);
+        sel.enter().append('path').attr('class','input-link')
+          .attr('fill','none')
+          .attr('stroke','var(--text-color)')
+          .attr('stroke-opacity', 0.25)
+          .attr('stroke-width', 1)
+          .attr('stroke-linecap','round')
+          .merge(sel)
+          .attr('d', d => `M${d.x0},${d.y0} C${d.c1x},${d.c1y} ${d.c2x},${d.c2y} ${d.x1},${d.y1}`)
+          .attr('stroke','var(--text-color)');
+        sel.exit().remove();
+      }
+
+      // Recompute input link path on the fly (used when node radii change)
+      function computeInputLinkD(idx){
+        const firstLayer = layers[0];
+        const n = firstLayer[idx]; if (!n) return '';
+        const x0 = inputGrid.x + inputGrid.width;
+        const k = firstLayer.length;
+        const band = inputGrid.height * 0.5;
+        const centerY = inputGrid.y + inputGrid.height / 2;
+        const yStart = centerY - band / 2;
+        const spacing = k > 1 ? band / (k - 1) : 0;
+        const y0 = k > 1 ? (yStart + idx * spacing) : centerY;
+        const yTarget = n.y;
+        const vx = n.x - x0; const vy = yTarget - y0; const L = Math.hypot(vx, vy) || 1;
+        const r = nodeRadiusForNode(n);
+        const x1 = n.x - (vx / L) * r;
+        const y1 = yTarget - (vy / L) * r;
+        const dx = (x1 - x0) * 0.35;
+        const c1x = x0 + dx, c1y = y0, c2x = x1 - dx, c2y = y1;
+        return `M${x0},${y0} C${c1x},${c1y} ${c2x},${c2y} ${x1},${y1}`;
+      }
+
+      function renderGraph(showEdges){
+        layoutNodes();
+        renderInputGrid();
+        renderInputLinks();
+        // Nodes
+        const allNodes = layers.flat();
+        const nodeSel = gNodes.selectAll('circle.node').data(allNodes, d=>d.id);
+        nodeSel.enter().append('circle').attr('class','node')
+          .attr('r', 10)
+          .attr('cx', d=>d.x).attr('cy', d=>d.y)
+          .attr('fill', d=> d.layer===2 ? 'var(--page-bg)' : 'var(--primary-color)')
+          .attr('fill-opacity', d=> d.layer===2 ? 1 : 0.12)
+          .attr('stroke', d=> d.layer===2 ? 'var(--border-color)' : 'var(--border-color)')
+          .attr('stroke-width',1)
+          .attr('stroke-linejoin','round')
+          .merge(nodeSel)
+          .attr('cx', d=>d.x).attr('cy', d=>d.y)
+          .attr('opacity', 1);
+        nodeSel.exit().remove();
+
+        // Labels for first hidden layer only (avoid stacking with output probs)
+        const labels = [];
+        layers[0].forEach((n,i)=> labels.push({ x:n.x-30, y:n.y+4, txt:`f${i+1}` }));
+        const labSel = gLabels.selectAll('text').data(labels);
+        labSel.enter().append('text')
+          .style('font-size','10px')
+          .style('fill','var(--muted-color)')
+          .style('paint-order','stroke')
+          .style('stroke','var(--page-bg)')
+          .style('stroke-width','3px')
+          .attr('x', d=>d.x)
+          .attr('y', d=>d.y)
+          .text(d=>d.txt)
+          .merge(labSel)
+          .style('paint-order','stroke')
+          .style('stroke','var(--page-bg)')
+          .style('stroke-width','5px')
+          .attr('x', d=>d.x)
+          .attr('y', d=>d.y)
+          .text(d=>d.txt);
+        labSel.exit().remove();
+
+        // Links as smooth curves
+        const linkSel = gLinks.selectAll('path.link').data(links, d=> `${d.s.l}-${d.s.i}-${d.t.l}-${d.t.j}`);
+        linkSel.enter().append('path').attr('class','link')
+          .attr('d', computeLinkD)
+          .attr('fill','none')
+          .attr('stroke','var(--text-color)')
+          .attr('stroke-opacity', 0.25)
+          .attr('stroke-width', d=> 0.5 + d.w*1.2)
+          .attr('stroke-linecap','round')
+          .merge(linkSel)
+          .attr('d', computeLinkD)
+          .attr('stroke','var(--text-color)')
+          .attr('stroke-width', d=> 0.5 + d.w*1.2);
+        linkSel.exit().remove();
+
+        // Ensure output labels remain aligned with the last layer on resize
+        gOutText.selectAll('g.out-label')
+          .attr('transform', function(d){
+            if (!d || typeof d.digit !== 'number') return d3.select(this).attr('transform');
+            const n = layers[2][d.digit];
+            if (!n) return d3.select(this).attr('transform');
+            const offset = nodeRadiusForNode(n) + 8;
+            return `translate(${n.x + offset},${n.y})`;
+          });
+        // Ensure clip-path circles are updated on resize
+        if (defs) {
+          const clips = defs.selectAll('clipPath.clip-node').data(layers[2], d=>d.id);
+          const ce = clips.enter().append('clipPath').attr('class','clip-node').attr('clipPathUnits','userSpaceOnUse').attr('id', d=>`clip-${d.id}`);
+          ce.append('circle');
+          clips.merge(ce).select('circle').attr('cx', d=>d.x).attr('cy', d=>d.y).attr('r', d=>nodeRadiusForNode(d));
+          clips.exit().remove();
+        }
+      }
+
+      function setNodeActivations(h1, h2, out){
+        layers[0].forEach((n,i)=> n.a = h1[i] || 0);
+        layers[1].forEach((n,i)=> n.a = h2[i] || 0);
+        layers[2].forEach((n,i)=> n.a = out[i] || 0);
+        // Determine top prediction (for ghosting others)
+        let argmaxIdx = 0; let bestProb = -1;
+        if (Array.isArray(out)) {
+          for (let i=0;i<out.length;i++){ if (out[i] > bestProb){ bestProb = out[i]; argmaxIdx = i; } }
+        }
+        // Color/size by activation with smooth transitions
+        gNodes.selectAll('circle.node')
+          .transition().duration(180).ease(d3.easeCubicOut)
+          .attr('fill', d=> d.layer===2 ? 'var(--page-bg)' : 'var(--primary-color)')
+          .attr('fill-opacity', d=> d.layer===2 ? 1 : (0.12 + 0.58*Math.min(1, d.a||0)))
+          .attr('stroke', 'var(--primary-color)')
+          .attr('stroke-opacity', d=> (d.layer===2 ? 0.9 : (0.45 + 0.45*Math.min(1, d.a||0))))
+          .attr('opacity', d=> 0.55 + 0.45*Math.min(1, d.a||0))
+          .attr('r', d=> nodeRadiusForNode(d));
+        // Link opacity by activation flow
+        gLinks.selectAll('path.link')
+          .transition().duration(180).ease(d3.easeCubicOut)
+          .attr('d', computeLinkD)
+          .attr('stroke','var(--text-color)')
+          .attr('stroke-opacity', d=>{
+            const aS = layers[d.s.l][d.s.i].a || 0; const aT = layers[d.t.l][d.t.j].a || 0;
+            return Math.min(1, 0.15 + 0.85 * (aS * aT));
+          })
+          .attr('stroke-width', d=>{
+            const aS = layers[d.s.l][d.s.i].a || 0; const aT = layers[d.t.l][d.t.j].a || 0;
+            return 0.6 + 2.2*(aS*aT);
+          });
+        // Theme-aware and activation-aware input links
+        gInputLinks.selectAll('path.input-link')
+          .transition().duration(180).ease(d3.easeCubicOut)
+          .attr('d', (d)=> computeInputLinkD(d.idx))
+          .attr('stroke','var(--text-color)')
+          .attr('stroke-opacity', 0.25)
+          .attr('stroke-width', d=> 0.6 + 2.0*(layers[0][d.idx] ? (layers[0][d.idx].a||0) : 0));
+        // Update clip-path circles to match new radii/positions of output nodes
+        if (defs) {
+          const clips = defs.selectAll('clipPath.clip-node').data(layers[2], d=>d.id);
+          clips.select('circle')
+            .transition().duration(180).ease(d3.easeCubicOut)
+            .attr('cx', d=>d.x)
+            .attr('cy', d=>d.y)
+            .attr('r', d=> nodeRadiusForNode(d));
+        }
+        // Theme-aware input links on updates handled above via transition
+        // Output labels: digit placed to the right of the node
+        const outs = layers[2].map((n,i)=>({ x:n.x + nodeRadiusForNode(n) + 8, y:n.y, digit: i, prob: (out[i]||0), isTop: i===argmaxIdx }));
+        const gSel = gOutText.selectAll('g.out-label').data(outs, d=>d.digit);
+        const gEnter = gSel.enter().append('g').attr('class','out-label');
+        gEnter.append('text').attr('class','out-digit')
+          .style('font-size','12px').style('font-weight','800').style('fill','var(--text-color)')
+          .attr('text-anchor','start').attr('dominant-baseline','middle')
+          .style('paint-order','stroke').style('stroke','var(--transparent-page-contrast)').style('stroke-width','3px');
+        const merged = gEnter.merge(gSel)
+          .attr('transform', d=>`translate(${d.x},${d.y})`)
+          .each(function(d){
+            const sel = d3.select(this);
+            sel.select('text.out-digit')
+              .attr('x', 0).attr('y', 0)
+              .text(String(d.digit));
+            // Ghost non-top predictions
+            sel.style('opacity', d.isTop ? 1 : 0.35);
+          });
+        // Remove any previous decorative rings (no highlight ring desired)
+        gRoot.selectAll('circle.top-ring').remove();
+        // (tooltip interactions removed)
+        gSel.exit().remove();
+
+        // Output liquid fill using clipPath + rect from bottom
+        const rects = gNodes.selectAll('rect.out-liquid').data(layers[2], d=>d.id);
+        const rectEnter = rects.enter().append('rect').attr('class','out-liquid')
+          .attr('fill','var(--primary-color)')
+          .attr('fill-opacity', 0.55)
+          .attr('clip-path', d => `url(#clip-${d.id})`);
+        rectEnter.merge(rects)
+          .transition().duration(180).ease(d3.easeCubicOut)
+          .attr('x', d=> d.x - nodeRadiusForNode(d))
+          .attr('width', d=> 2 * nodeRadiusForNode(d))
+          .attr('y', d=> {
+            const r = nodeRadiusForNode(d);
+            const h = 2 * r * Math.max(0, Math.min(1, d.a||0));
+            return d.y + r - h;
+          })
+          .attr('height', d=> 2 * nodeRadiusForNode(d) * Math.max(0, Math.min(1, d.a||0)))
+          .attr('fill-opacity', 0.55);
+        rects.exit().remove();
+      }
+
+      // (no separate updateBars; bars are rendered next to nodes)
+
+      function runPipeline(){
+        const x28raw = downsample28();
+        const x28 = dilate28(normalize28(x28raw));
+        // Update input grid data
+        lastX28 = x28;
+        renderInputGrid();
+        const feats = computeFeatures(x28); // 8D in [0,1]
+        const inkMass = feats[0];
+        // Hide hint when user has drawn something
+        if (hint) { hint.style.opacity = inkMass < 0.01 ? 1 : 0; }
+        // Hidden 1 = raw features
+        const h1 = feats;
+        // Hidden 2 = simple non-linear mix for visualization only
+        const h2 = layers[1].map((_, j)=>{
+          let s=0; for (let i=0;i<layers[0].length;i++){ const w = (Math.sin(i*17+j*31)+1)/2 * 0.8 + 0.1; s += w*h1[i]; }
+          return Math.tanh(s*0.8);
+        });
+        let prob;
+        if (inkMass < 0.03){
+          // Too little ink: return near-uniform distribution
+          prob = Array.from({length:10}, ()=> 1/10);
+        } else {
+          // Prefer TFJS model if available
+          const tfProbs = predictTfjs(x28);
+          if (tfProbs && tfProbs.length === 10) {
+            prob = tfProbs;
+          } else {
+            // Fallback: rely mostly on glyph similarity
+            const x28n = normalize(x28);
+            const logitsGlyph = protoGlyphs28.map(p => 8.0 * cosine(x28n, p));
+            const logitsLinear = W.map((row, k)=> dot(row, h1) + b[k]);
+            const logits = logitsGlyph.map((v,k)=> v + 0.2*logitsLinear[k]);
+            prob = softmax(logits);
+          }
+        }
+        setNodeActivations(h1, h2.map(v => (v+1)/2), prob);
+      }
+
+      function downsample28(){
+        // From canvas (224x224) to 28x28 by average pooling in 8x8 blocks
+        const block = CANVAS_PX/28; // 8
+        const src = ctx.getImageData(0,0,CANVAS_PX,CANVAS_PX).data;
+        const out = new Float32Array(28*28);
+        for (let gy=0; gy<28; gy++){
+          for (let gx=0; gx<28; gx++){
+            let acc=0; let cnt=0;
+            const x0 = Math.floor(gx*block), y0 = Math.floor(gy*block);
+            for (let y=y0; y<y0+block; y++){
+              for (let x=x0; x<x0+block; x++){
+                const idx = (y*CANVAS_PX + x)*4; // RGBA
+                const r=src[idx], g=src[idx+1], b=src[idx+2];
+                const gray = (r+g+b)/3/255; // 1: white, 0: black
+                const ink = 1-gray; // 1: ink/black
+                acc += ink; cnt++;
+              }
+            }
+            out[gy*28+gx] = acc/(cnt||1);
+          }
+        }
+        return out;
+      }
+
+      function clearCanvas(){ ctx.fillStyle = '#ffffff'; ctx.fillRect(0,0,CANVAS_PX,CANVAS_PX); runPipeline(); }
+
+      // Drawing interactions
+      let drawing=false; let last=null;
+      let hasInteracted=false;
+      const getPos = (ev) => {
+        const rect = canvas.getBoundingClientRect();
+        const sx = CANVAS_PX/rect.width; const sy = CANVAS_PX/rect.height;
+        const x = (('touches' in ev)? ev.touches[0].clientX : ev.clientX) - rect.left;
+        const y = (('touches' in ev)? ev.touches[0].clientY : ev.clientY) - rect.top;
+        return { x: x*sx, y: y*sy };
+      };
+      function drawTo(p){
+        const size = 24;
+        ctx.lineCap='round'; ctx.lineJoin='round'; ctx.strokeStyle='#000000'; ctx.lineWidth=size;
+        if (!last) last = p;
+        ctx.beginPath(); ctx.moveTo(last.x, last.y); ctx.lineTo(p.x, p.y); ctx.stroke();
+        last = p; runPipeline();
+      }
+      function onDown(ev){
+        drawing=true; last=null;
+        if (!hasInteracted){ hasInteracted=true; try { eraseBtn.style.display = 'flex'; } catch(_) {} }
+        drawTo(getPos(ev)); ev.preventDefault();
+      }
+      function onMove(ev){ if (!drawing) return; drawTo(getPos(ev)); ev.preventDefault(); }
+      function onUp(){ drawing=false; last=null; }
+      canvas.addEventListener('mousedown', onDown); canvas.addEventListener('mousemove', onMove); window.addEventListener('mouseup', onUp);
+      canvas.addEventListener('touchstart', onDown, { passive:false }); canvas.addEventListener('touchmove', onMove, { passive:false }); window.addEventListener('touchend', onUp);
+
+      // (erase button handled as overlay)
+      const rerender = () => { renderGraph(true); };
+      if (window.ResizeObserver) {
+        const ro = new ResizeObserver(()=>rerender());
+        ro.observe(right);
+        ro.observe(canvas);
+      } else { window.addEventListener('resize', rerender); }
+
+      // TFJS model (optional)
+      let tfModel = null;
+      const tryLoadModel = async () => {
+        await new Promise((res)=> ensureTF(res));
+        const candidates = [
+          // Prefer public path via symlink to assets/data
+          '/data/mnist-variant-model.json',
+          // Fallbacks to relative copies under content assets (shards must be colocated)
+          './assets/data/mnist-variant-model.json',
+          '../assets/data/mnist-variant-model.json',
+          '/assets/data/mnist-variant-model.json',
+          // Fallback to public TFJS MNIST
+          'https://storage.googleapis.com/tfjs-models/tfjs/mnist/model.json'
+        ];
+        for (const u of candidates){
+          try { tfModel = await tf.loadLayersModel(u); return; } catch(_) { /* try next */ }
+        }
+        tfModel = null;
+      };
+
+      function predictTfjs(x28){
+        if (!tfModel || !window.tf) return null;
+        const run = (arr) => {
+          const t = tf.tidy(()=> tf.tensor(arr, [28,28,1]).expandDims(0));
+          try { const y = tfModel.predict(t); const p = y.softmax(); const out = Array.from(p.dataSync()); tf.dispose([y,p,t]); return out; } catch(e){ tf.dispose(t); return null; }
+        };
+        // Try both orientations and keep the one with higher confidence
+        const p1 = run(x28);
+        const inv = x28.map(v=>1-v);
+        const p2 = run(inv);
+        let probs = p1 || p2;
+        if (p1 && p2){
+          const m1 = Math.max(...p1), m2 = Math.max(...p2);
+          probs = m2>m1 ? p2 : p1;
+        }
+        if (!probs) return null;
+        // Normalize output size to 10 classes (pad or slice)
+        if (probs.length < 10){ probs = probs.concat(Array(10 - probs.length).fill(0)); }
+        if (probs.length > 10){ probs = probs.slice(0,10); }
+        return probs;
+      }
+
+      // Initial render
+      renderGraph(true);
+      clearCanvas();
+      tryLoadModel();
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
+
+
+
+
diff --git a/app/src/content/embeds/d3-pie-quad.html b/app/src/content/embeds/d3-pie-quad.html
new file mode 100644
index 0000000000000000000000000000000000000000..8730990f25ad444b03d8ee433f781998444ed826
--- /dev/null
+++ b/app/src/content/embeds/d3-pie-quad.html
@@ -0,0 +1,347 @@
+<div class="d3-pie-quad"></div>
+<style>
+  /* Layout piloté par container queries (par rapport au parent) */
+  .d3-pie-quad { container-type: inline-size; }
+  .d3-pie-quad .legend { width: 80%;margin: 0 auto; font-size: 12px; line-height: 1.35; color: var(--text-color); }
+  .d3-pie-quad .legend { margin-bottom: 32px; }
+  .d3-pie-quad .legend .items { display:flex; flex-wrap:wrap; gap:8px 14px; align-items:center; justify-content:center; }
+  .d3-pie-quad .legend .item { display:flex; align-items:center; gap:8px; white-space:nowrap; }
+  .d3-pie-quad .legend .swatch { width:14px; height:14px; border-radius:3px; display:inline-block; border: 1px solid var(--border-color); }
+  .d3-pie-quad .legend .title { display:block; text-align:center; font-weight:800; margin-bottom:6px; }
+  .d3-pie-quad .caption { font-size: 14px; font-weight: 800; fill: var(--text-color); }
+  .d3-pie-quad .caption-subtitle { font-size: 11px; font-weight: 400; fill: var(--muted-color); }
+  .d3-pie-quad .nodata { font-size: 12px; fill: var(--muted-color); }
+  /* Ghost legend items when hovering slices */
+  .d3-pie-quad.hovering .legend .item.ghost { opacity: .35; }
+  .d3-pie-quad .slice-label { font-size: 11px; font-weight: 700; fill: var(--text-color); paint-order: stroke; stroke: var(--transparent-page-contrast); stroke-width: 3px; }
+  /* Effet ghost synchronisé */
+  .d3-pie-quad .slice {
+    transition: opacity .15s ease;
+  }
+  .d3-pie-quad.hovering .slice.ghost {
+    opacity: .25;
+  }
+  /* Layout HTML (pas JS) pour la grille et les cellules */
+  .d3-pie-quad .plots-grid {
+    display: flex;
+    flex-wrap: wrap;
+    justify-content: center;
+    align-items: flex-start;
+    gap: 12px 20px;
+    margin-top: 4px;
+    margin-left: auto;
+    margin-right: auto;
+    width: 100%;
+  }
+  /* Par défaut (flux ~1280): 2 colonnes centrées */
+  .content-grid .d3-pie-quad .plots-grid { width: 100%; }
+  .content-grid .d3-pie-quad .pie-cell { flex: 0 0 calc((100% - 20px)/2); }
+  /* En wrappers larges: viser 4 colonnes si l'espace le permet */
+  .wide .d3-pie-quad .plots-grid,
+  .full-width .d3-pie-quad .plots-grid { width: 100%; }
+  .wide .d3-pie-quad .pie-cell,
+  .full-width .d3-pie-quad .pie-cell { flex: 0 0 calc((100% - 60px)/4); }
+  /* Forcer 2 colonnes dans le flux lorsque le parent ~1280px */
+  .content-grid .d3-pie-quad .plots-grid { width: min(740px, 100%); }
+  .d3-pie-quad .pie-cell {
+    display: flex;
+    flex-direction: column;
+    align-items: center;
+    flex: 0 0 360px; /* 2 colonnes fixes dans le flux à 1280px */
+  }
+  /* 4/2/1 colonnes en fonction de la largeur du parent */
+  /* @container (min-width: 740px) {
+    .d3-pie-quad .plots-grid { width: 740px; }
+  }
+  @container (max-width: 739.98px) {
+    .d3-pie-quad .plots-grid { width: 100%; }
+  } */
+  @media (max-width: 500px) {
+    .d3-pie-quad .pie-cell { flex: 0 0 100%; }
+  }
+  /* Tooltip styling aligned with filters-quad */
+  .d3-pie-quad .d3-tooltip {
+    z-index: var(--z-elevated);
+    backdrop-filter: saturate(1.12) blur(8px);
+  }
+  .d3-pie-quad .d3-tooltip__inner {
+    display: flex;
+    flex-direction: column;
+    gap: 6px;
+    min-width: 220px;
+  }
+  .d3-pie-quad .d3-tooltip__inner > div:first-child {
+    font-weight: 800;
+    letter-spacing: 0.1px;
+    margin-bottom: 0;
+  }
+  .d3-pie-quad .d3-tooltip__inner > div:nth-child(2) {
+    font-size: 11px;
+    color: var(--muted-color);
+    display: block;
+    margin-top: -4px;
+    margin-bottom: 2px;
+    letter-spacing: 0.1px;
+  }
+  .d3-pie-quad .d3-tooltip__inner > div:nth-child(n+3) {
+    padding-top: 6px;
+    border-top: 1px solid var(--border-color);
+  }
+  .d3-pie-quad .d3-tooltip__color-dot {
+    display: inline-block;
+    width: 12px;
+    height: 12px;
+    border-radius: 3px;
+    border: 1px solid var(--border-color);
+  }
+</style>
+<script>
+  (() => {
+    const THIS_SCRIPT = document.currentScript;
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = THIS_SCRIPT;
+      const host = scriptEl && scriptEl.parentElement;
+      let container = null;
+      if (host && host.querySelector) {
+        container = host.querySelector('.d3-pie-quad');
+      }
+      if (!container) {
+        let sib = scriptEl && scriptEl.previousElementSibling;
+        while (sib && !(sib.classList && sib.classList.contains('d3-pie-quad'))) {
+          sib = sib.previousElementSibling;
+        }
+        container = sib || document.querySelector('.d3-pie-quad');
+      }
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted === 'true') return; container.dataset.mounted = 'true'; }
+
+      // Tooltip
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none',
+          padding:'10px 12px', borderRadius:'12px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)',
+          background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 8px 32px rgba(0,0,0,.28), 0 2px 8px rgba(0,0,0,.12)', opacity:'0', transition:'opacity .12s ease',
+          zIndex: 'var(--z-elevated)', backdropFilter: 'saturate(1.12) blur(8px)'
+        });
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // HTML scaffolding: legend and plots grid as HTML; only pies are SVG
+      const legendHost = document.createElement('div'); legendHost.className = 'legend'; container.appendChild(legendHost);
+      const plotsHost = document.createElement('div'); plotsHost.className = 'plots-grid'; container.appendChild(plotsHost);
+
+      // Metrics (order and labels as in the Python script)
+      const METRICS = [
+        { key:'answer_total_tokens', name:'Answer Tokens', title:'Weighted by ', letter:'a' },
+        { key:'total_samples',       name:'Number of Samples', title:'Weighted by ', letter:'b' },
+        { key:'total_turns',         name:'Number of Turns', title:'Weighted by ', letter:'c' },
+        { key:'total_images',        name:'Number of Images', title:'Weighted by ', letter:'d' }
+      ];
+
+      // CSV: load from public path
+      const CSV_PATHS = [
+        '/data/vision.csv'
+      ];
+
+      const fetchFirstAvailable = async (paths) => {
+        for (const p of paths) {
+          try {
+            const res = await fetch(p, { cache: 'no-cache' });
+            if (res.ok) { return await res.text(); }
+          } catch (_) { /* try next */ }
+        }
+        throw new Error('CSV not found: vision.csv');
+      };
+
+      const parseCsv = (text) => d3.csvParse(text, (d) => ({
+        subset_name: (d['subset_name']||'').trim(),
+        eagle_cathegory: (d['eagle_cathegory']||'').trim(),
+        answer_total_tokens: +((d['answer_total_tokens']||'0').toString().trim()) || 0,
+        total_samples: +((d['total_samples']||'0').toString().trim()) || 0,
+        total_turns: +((d['total_turns']||'0').toString().trim()) || 0,
+        total_images: +((d['total_images']||'0').toString().trim()) || 0
+      }));
+
+      // Layout
+      let width=800; const margin = { top: 8, right: 24, bottom: 0, left: 24 };
+      const CAPTION_GAP = 36;   // espace entre titre et donut
+      const GAP_X = 20;         // espace entre colonnes
+      const GAP_Y = 12;         // espace entre lignes
+      const TOP_OFFSET = 4;     // décalage vertical supplémentaire pour aérer le haut
+      const DONUT_INNER_RATIO = 0.58; // ratio du trou central (0 = pie plein, 0.5 = moitié)
+      // LEGEND_GAP supprimé: l'espacement est désormais géré en CSS via .d3-pie-quad .legend { margin-bottom }
+      const SVG_VPAD = 16;      // padding vertical supplémentaire à l'intérieur des SVG pour éviter la coupe
+      
+      const updateSize = () => {
+        width = container.clientWidth || 800;
+        return { innerWidth: width - margin.left - margin.right };
+      };
+
+      function renderLegend(categories, colorOf){
+        legendHost.style.display = 'flex';
+        legendHost.style.alignItems = 'center';
+        legendHost.style.justifyContent = 'center';
+        legendHost.innerHTML = `<div class="items">${categories.map(c => `<div class="item" data-category="${c}"><span class=\"swatch\" style=\"background:${colorOf(c)}\"></span><span style=\"font-weight:500\">${c}</span></div>`).join('')}</div>`;
+      }
+
+      function drawPies(rows){
+        const { innerWidth } = updateSize();
+
+        // Catégories (triées) + échelle de couleurs harmonisée avec banner.html
+        const categories = Array.from(new Set(rows.map(r => r.eagle_cathegory || 'Unknown'))).sort();
+        const getCatColors = (n) => {
+          try { if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') return window.ColorPalettes.getColors('categorical', n); } catch(_) {}
+          return (d3.schemeTableau10 ? d3.schemeTableau10.slice(0, n) : ['#4e79a7','#f28e2b','#e15759','#76b7b2','#59a14f','#edc948','#b07aa1','#ff9da7','#9c755f','#bab0ab'].slice(0, n));
+        };
+        const color = d3.scaleOrdinal().domain(categories).range(getCatColors(categories.length));
+        const colorOf = (cat) => color(cat || 'Unknown');
+
+        // Clear plots grid
+        plotsHost.innerHTML = '';
+
+        // Légende au-dessus, centrée
+        renderLegend(categories, colorOf);
+
+        // Rayon fixé selon la largeur cible d'une cellule (gérée par CSS)
+        const CELL_BASIS = 360; // doit correspondre à .pie-cell { flex-basis }
+        const radius = Math.max(80, Math.min(120, Math.floor(CELL_BASIS * 0.42)));
+        const innerR = Math.round(radius * DONUT_INNER_RATIO);
+        // Placement géré par CSS; ici on ne fait que l'espacement vertical minimal
+        plotsHost.style.position = 'relative';
+        plotsHost.style.marginTop = (TOP_OFFSET) + 'px';
+
+        const pie = d3.pie().sort(null).value(d => d.value).padAngle(0.02);
+        const arc = d3.arc().innerRadius(innerR).outerRadius(radius).cornerRadius(3);
+        const arcLabel = d3.arc().innerRadius((innerR + radius) / 2).outerRadius((innerR + radius) / 2);
+
+        // Légende déjà rendue au-dessus
+
+        METRICS.forEach((metric, idx) => {
+          // Aggregate by category
+          const totals = new Map(); categories.forEach(c => totals.set(c, 0));
+          rows.forEach(r => { totals.set(r.eagle_cathegory, totals.get(r.eagle_cathegory) + (r[metric.key] || 0)); });
+          const values = categories.map(c => ({ category: c, value: totals.get(c) || 0 }));
+          const nonZeroValues = values.filter(v => (v.value || 0) > 0);
+          const totalSum = d3.sum(nonZeroValues, d => d.value);
+
+          // Create HTML cell container
+          const cell = document.createElement('div');
+          cell.className = 'pie-cell';
+          cell.style.width = (radius * 2) + 'px';
+          cell.style.height = (radius * 2 + SVG_VPAD * 2 + CAPTION_GAP + 24) + 'px';
+          cell.style.display = 'flex';
+          cell.style.flexDirection = 'column';
+          cell.style.alignItems = 'center';
+          cell.style.justifyContent = 'flex-start';
+          plotsHost.appendChild(cell);
+
+          // SVG pie inside cell
+          const svg = d3.select(cell).append('svg').attr('width', radius * 2).attr('height', radius * 2 + SVG_VPAD * 2).style('display','block');
+          const gCell = svg.append('g').attr('transform', `translate(${radius},${radius + SVG_VPAD})`);
+
+          if (!totalSum || totalSum <= 0 || nonZeroValues.length === 0) {
+            gCell.append('text').attr('class','nodata').attr('text-anchor','middle').attr('dy','0').text('No data for this metric');
+          } else {
+            const data = pie(nonZeroValues);
+            const percent = (v) => (v / totalSum) * 100;
+
+            // Slices
+            const slices = gCell.selectAll('path.slice').data(data).enter().append('path').attr('class','slice')
+              .attr('d', arc)
+              .attr('fill', d => colorOf(d.data.category))
+              .attr('stroke', 'var(--surface-bg)')
+              .attr('stroke-width', 1.2)
+              .attr('data-category', d => d.data.category)
+              .on('mouseenter', function(ev, d){
+                const hoveredCategory = d.data.category;
+                d3.select(container).classed('hovering', true);
+                d3.select(container).selectAll('path.slice').classed('ghost', s => (s.data && s.data.category) !== hoveredCategory);
+                // Ghost legend items that are not hovered
+                d3.select(legendHost).selectAll('.item').classed('ghost', function(){ return this.dataset && this.dataset.category !== hoveredCategory; });
+                d3.select(this).attr('stroke', 'rgba(0,0,0,0.85)').attr('stroke-width', 1);
+                const p = percent(d.data.value);
+                const catColor = colorOf(d.data.category);
+                let html = `<div style="display:flex;align-items:center;gap:8px;white-space:nowrap;"><span class=\"d3-tooltip__color-dot\" style=\"background:${catColor}\"></span><strong>${d.data.category}</strong></div>`;
+                html += `<div>${metric.name}</div>`;
+                html += `<div style="display:flex;align-items:center;gap:6px;white-space:nowrap;"><strong>Value</strong><span style="margin-left:auto;text-align:right;">${d.data.value.toLocaleString()}</span></div>`;
+                /* Share row removed per request */
+                tipInner.innerHTML = html;
+                tip.style.opacity = '1';
+              })
+              .on('mousemove', function(ev){
+                const [mx, my] = d3.pointer(ev, container); const offsetX = 12, offsetY = 12; tip.style.transform = `translate(${Math.round(mx+offsetX)}px, ${Math.round(my+offsetY)}px)`;
+              })
+              .on('mouseleave', function(){
+                tip.style.opacity='0'; tip.style.transform='translate(-9999px, -9999px)';
+                d3.select(container).classed('hovering', false);
+                d3.select(container).selectAll('path.slice').classed('ghost', false);
+                d3.select(legendHost).selectAll('.item').classed('ghost', false);
+                d3.select(this).attr('stroke','var(--surface-bg)');
+              });
+
+            // Percentage labels (>= 3%)
+            gCell.selectAll('text.slice-label').data(data.filter(d => percent(d.data.value) >= 3)).enter()
+              .append('text').attr('class','slice-label').style('pointer-events','none')
+              .attr('transform', d => `translate(${arcLabel.centroid(d)})`)
+              .attr('text-anchor','middle')
+              .text(d => `${percent(d.data.value).toFixed(1)}%`);
+          }
+
+          // HTML captions under the SVG (keep design)
+          const subtitleEl = document.createElement('div'); subtitleEl.className = 'caption-subtitle'; subtitleEl.textContent = metric.title; subtitleEl.style.textAlign = 'center'; cell.appendChild(subtitleEl);
+          const titleEl = document.createElement('div'); titleEl.className = 'caption'; titleEl.textContent = metric.name; titleEl.style.textAlign = 'center'; cell.appendChild(titleEl);
+        });
+
+        // Container height flows naturally with HTML; nothing to do
+
+        // Reset global hover/ghost when leaving the plots area
+        plotsHost.onmouseleave = () => {
+          tip.style.opacity='0';
+          tip.style.transform='translate(-9999px, -9999px)';
+          d3.select(container).classed('hovering', false);
+          d3.select(container).selectAll('path.slice').classed('ghost', false);
+          d3.select(legendHost).selectAll('.item').classed('ghost', false);
+        };
+      }
+
+      async function init(){
+        try {
+          const text = await fetchFirstAvailable(CSV_PATHS);
+          const rows = parseCsv(text);
+          drawPies(rows);
+
+          // Resize handling
+          const rerender = () => drawPies(rows);
+          if (window.ResizeObserver) { const ro = new ResizeObserver(() => rerender()); ro.observe(container); }
+          else { window.addEventListener('resize', rerender); }
+        } catch (err) {
+          const pre = document.createElement('pre'); pre.textContent = (err && err.message) ? err.message : String(err);
+          pre.style.color = 'var(--danger, #b00020)'; pre.style.fontSize = '12px'; pre.style.whiteSpace = 'pre-wrap';
+          container.appendChild(pre);
+        }
+      }
+
+      init();
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
+
+
+
+
+
+
diff --git a/app/src/content/embeds/d3-pie.html b/app/src/content/embeds/d3-pie.html
new file mode 100644
index 0000000000000000000000000000000000000000..80c520b0ec81243fcfa79b682adae24c3c72fcbe
--- /dev/null
+++ b/app/src/content/embeds/d3-pie.html
@@ -0,0 +1,154 @@
+<div class="d3-pie"></div>
+<style>
+  .d3-pie { position: relative; }
+  .d3-pie .legend { display:flex; flex-direction:column; align-items:flex-start; gap:6px; margin: 8px 0 0 0; font-size:12px; color: var(--text-color); }
+  .d3-pie .legend .legend-title { font-size:12px; font-weight:700; color: var(--text-color); }
+  .d3-pie .legend .items { display:flex; flex-wrap:wrap; gap:8px 14px; }
+  .d3-pie .legend .item { display:inline-flex; align-items:center; gap:6px; white-space:nowrap; }
+  .d3-pie .legend .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); }
+  /* Ghost legend items when hovering slices */
+  .d3-pie.hovering .legend .item.ghost { opacity: .35; }
+  /* Ghost effect on slices */
+  .d3-pie .slice { transition: opacity .15s ease; }
+  .d3-pie.hovering .slice.ghost { opacity: .25; }
+  /* Labels with contrast liseret */
+  .d3-pie .slice-label { font-size: 11px; font-weight: 700; fill: var(--text-color); paint-order: stroke; stroke: var(--transparent-page-contrast); stroke-width: 3px; }
+  .d3-pie .d3-tooltip { position:absolute; top:0; left:0; transform:translate(-9999px,-9999px); pointer-events:none; padding:8px 10px; border-radius:8px; font-size:12px; line-height:1.35; border:1px solid var(--border-color); background:var(--surface-bg); color:var(--text-color); box-shadow:0 4px 24px rgba(0,0,0,.18); opacity:0; transition:opacity .12s ease; }
+  .d3-pie .d3-tooltip { z-index: var(--z-elevated); backdrop-filter: saturate(1.12) blur(8px); }
+  .d3-pie .d3-tooltip__inner { display:flex; flex-direction:column; gap:6px; min-width: 220px; text-align: left; }
+  .d3-pie .d3-tooltip__inner > div:first-child { font-weight: 800; letter-spacing: 0.1px; margin-bottom: 0; }
+  .d3-pie .d3-tooltip__inner > div:nth-child(2) { font-size: 11px; color: var(--muted-color); display: block; margin-top: -4px; margin-bottom: 2px; letter-spacing: 0.1px; }
+  .d3-pie .d3-tooltip__inner > div:nth-child(n+3) { padding-top: 6px; border-top: 1px solid var(--border-color); }
+  .d3-pie .d3-tooltip .swatch { width:12px; height:12px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; margin-right:6px; }
+  .d3-pie .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+</style>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id='d3-cdn-script'; s.src='https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once:true }); if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-pie'))){
+        const cs = Array.from(document.querySelectorAll('.d3-pie')).filter(el => !(el.dataset && el.dataset.mounted==='true'));
+        container = cs[cs.length-1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted==='true') return; container.dataset.mounted='true'; }
+
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) { tip = document.createElement('div'); tip.className = 'd3-tooltip'; tipInner = document.createElement('div'); tipInner.className='d3-tooltip__inner'; tip.appendChild(tipInner); container.appendChild(tip); } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      const card = document.createElement('div'); card.className = 'chart-card'; container.appendChild(card);
+      const legend = document.createElement('div'); legend.className = 'legend'; legend.innerHTML = '<div class="legend-title">Legend</div><div class="items"></div>'; container.appendChild(legend);
+
+      const svg = d3.select(card).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+
+      const DEFAULT_CSV = '/data/vision.csv';
+      const fetchFirstAvailable = async (paths) => {
+        for (const p of paths) { try { const r = await fetch(p, { cache:'no-cache' }); if (r.ok) return await r.text(); } catch(_){} }
+        throw new Error('CSV not found: vision.csv');
+      };
+      function parseCsv(text){
+        return d3.csvParse(text, d => ({
+          category: (d['eagle_cathegory']||d['category']||'').trim(),
+          value: +((d['total_samples']||d['value']||'0').toString().trim()) || 0
+        }));
+      }
+
+      let width=800, height=340; const DONUT_INNER_RATIO = 0.6;
+      function updateSize(){
+        width = container.clientWidth || 800; height = Math.max(240, Math.round(width/3));
+        svg.attr('width', width).attr('height', height);
+        gRoot.attr('transform', `translate(${width/2},${height/2})`);
+        return { inner: Math.min(width, height) * 0.42 };
+      }
+
+      function makeLegend(categories, colorOf){
+        const items = legend.querySelector('.items'); items.innerHTML = '';
+        categories.forEach(name => { const el = document.createElement('span'); el.className='item'; el.dataset.category=name; const sw=document.createElement('span'); sw.className='swatch'; sw.style.background=colorOf(name); const txt=document.createElement('span'); txt.textContent=name; el.appendChild(sw); el.appendChild(txt); items.appendChild(el); });
+      }
+
+      function render(rows){
+        const { inner } = updateSize();
+        const categories = Array.from(new Set(rows.map(r => r.category || 'Unknown'))).sort();
+        const getColors = (n) => { try { if (window.ColorPalettes && typeof window.ColorPalettes.getColors==='function') return window.ColorPalettes.getColors('categorical', n); } catch(_){} return (window.d3 && d3.schemeTableau10) ? d3.schemeTableau10.slice(0, n) : ['#4e79a7','#f28e2b','#e15759','#76b7b2','#59a14f','#edc948','#b07aa1','#ff9da7','#9c755f','#bab0ab'].slice(0,n); };
+        const palette = getColors(categories.length);
+        const color = d3.scaleOrdinal().domain(categories).range(palette);
+        const colorOf = (c) => color(c || 'Unknown');
+
+        makeLegend(categories, colorOf);
+
+        const totals = new Map(); categories.forEach(c => totals.set(c, 0)); rows.forEach(r => totals.set(r.category, (totals.get(r.category)||0) + (r.value||0)));
+        const values = categories.map(c => ({ category:c, value: totals.get(c)||0 })).filter(d => d.value > 0);
+        const sum = d3.sum(values, d=>d.value) || 1;
+
+        const radius = Math.max(60, Math.min(inner, 120));
+        const innerR = Math.round(radius * DONUT_INNER_RATIO);
+        const pie = d3.pie().sort(null).value(d=>d.value).padAngle(0.02);
+        const arc = d3.arc().innerRadius(innerR).outerRadius(radius).cornerRadius(3);
+        const arcLabel = d3.arc().innerRadius((innerR + radius)/2).outerRadius((innerR + radius)/2);
+
+        const data = pie(values);
+        const slices = gRoot.selectAll('path.slice').data(data, d=>d.data.category);
+        slices.enter().append('path').attr('class','slice')
+          .attr('fill', d=>colorOf(d.data.category))
+          .attr('stroke','var(--surface-bg)')
+          .attr('stroke-width',1)
+          .attr('data-category', d => d.data.category)
+          .on('mouseenter', (ev, d) => {
+            const pct = (d.data.value / sum) * 100;
+            container.classList.add('hovering');
+            gRoot.selectAll('path.slice').classed('ghost', s => (s && s.data && s.data.category) !== d.data.category);
+            try { const items = legend.querySelectorAll('.item'); items.forEach(it => it.classList.toggle('ghost', it.dataset.category !== d.data.category)); } catch(_) {}
+            const colorSw = colorOf(d.data.category);
+            tipInner.innerHTML = `<div style="display:flex;align-items:center;gap:8px;white-space:nowrap;"><span class=\"swatch\" style=\"background:${colorSw}\"></span><strong>${d.data.category}</strong></div>` +
+              `<div>Value</div>` +
+              `<div style=\"display:flex;align-items:center;gap:6px;white-space:nowrap;\"><strong>Total</strong><span style=\"margin-left:auto;text-align:right;\">${d.data.value.toLocaleString()} (${pct.toFixed(1)}%)</span></div>`;
+            tip.style.opacity='1';
+          })
+          .on('mousemove', (ev) => { const [mx,my] = d3.pointer(ev, container); tip.style.transform = `translate(${Math.round(mx+12)}px, ${Math.round(my+12)}px)`; })
+          .on('mouseleave', () => {
+            tip.style.opacity='0'; tip.style.transform='translate(-9999px, -9999px)';
+            container.classList.remove('hovering');
+            gRoot.selectAll('path.slice').classed('ghost', false);
+            try { const items = legend.querySelectorAll('.item'); items.forEach(it => it.classList.remove('ghost')); } catch(_) {}
+          })
+          .merge(slices)
+          .attr('d', arc)
+          .attr('fill', d=>colorOf(d.data.category));
+        slices.exit().remove();
+
+        const labels = gRoot.selectAll('text.slice-label').data(data.filter(d => (d.data.value/sum) >= 0.03), d=>d.data.category);
+        labels.enter().append('text').attr('class','slice-label').attr('text-anchor','middle')
+          .merge(labels)
+          .attr('transform', d => `translate(${arcLabel.centroid(d)})`)
+          .text(d => `${((d.data.value/sum)*100).toFixed(1)}%`);
+        labels.exit().remove();
+      }
+
+      (async () => {
+        try {
+          const text = await fetchFirstAvailable([DEFAULT_CSV, './assets/data/vision.csv', '../assets/data/vision.csv']);
+          const rows = parseCsv(text);
+          render(rows);
+          const rerender = () => render(rows);
+          if (window.ResizeObserver) { const ro = new ResizeObserver(() => rerender()); ro.observe(container); } else { window.addEventListener('resize', rerender); }
+        } catch (e) {
+          const pre = document.createElement('pre'); pre.textContent = (e && e.message) ? e.message : String(e); pre.style.color='var(--danger, #b00020)'; pre.style.fontSize='12px'; pre.style.whiteSpace='pre-wrap'; container.appendChild(pre);
+        }
+      })();
+    };
+
+    if (document.readyState==='loading'){ document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once:true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
+
diff --git a/app/src/content/embeds/d3-scatter.html b/app/src/content/embeds/d3-scatter.html
new file mode 100644
index 0000000000000000000000000000000000000000..895cd77adbc6e04dbdf25f1128aa6b6098ab3819
--- /dev/null
+++ b/app/src/content/embeds/d3-scatter.html
@@ -0,0 +1,300 @@
+<div class="d3-scatter"  ></div>
+<style>
+  /* Frameless: no controls, no axes, only dots */
+  .d3-scatter svg { display: block; }
+  /* Tooltip refined styling (align with filters-quad) */
+  .d3-scatter .d3-tooltip {
+    z-index: 20;
+    backdrop-filter: saturate(1.12) blur(8px);
+  }
+  .d3-scatter .d3-tooltip__inner {
+    display: flex;
+    flex-direction: column;
+    gap: 6px;
+    min-width: 200px;
+  }
+  .d3-scatter .d3-tooltip__inner > div:first-child {
+    font-weight: 800;
+    letter-spacing: 0.1px;
+    margin-bottom: 0;
+  }
+  .d3-scatter .d3-tooltip__inner > div:nth-child(2) {
+    font-size: 11px;
+    color: var(--muted-color);
+    display: block;
+    margin-top: -4px;
+    margin-bottom: 2px;
+    letter-spacing: 0.1px;
+  }
+  .d3-scatter .d3-tooltip__inner > div:nth-child(n+3) {
+    padding-top: 6px;
+    border-top: 1px solid var(--border-color);
+  }
+</style>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-scatter'))){
+        const cs = Array.from(document.querySelectorAll('.d3-scatter')).filter(el => !(el.dataset && el.dataset.mounted==='true'));
+        container = cs[cs.length-1] || null;
+      }
+      if (!container) return;
+      if (container.dataset){ if (container.dataset.mounted==='true') return; container.dataset.mounted='true'; }
+
+      // Tooltip
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        Object.assign(tip.style, { position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none', padding:'10px 12px', borderRadius:'12px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)', background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 8px 32px rgba(0,0,0,.28), 0 2px 8px rgba(0,0,0,.12)', opacity:'0', transition:'opacity .12s ease', backdropFilter:'saturate(1.12) blur(8px)' });
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // SVG
+      const svg = d3.select(container).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+      const gGrid = gRoot.append('g').attr('class','grid');
+      const gAxes = gRoot.append('g').attr('class','axes');
+      const gDots = gRoot.append('g').attr('class','dots');
+      const gCentroids = gRoot.append('g').attr('class','centroids');
+      const gLegend = gRoot.append('foreignObject').attr('class','legend');
+
+      // State & scales
+      let width=800, height=360; const margin = { top: 8, right: 12, bottom: 8, left: 12 };
+      const x = d3.scaleLinear();
+      const y = d3.scaleLinear();
+      const color = d3.scaleOrdinal();
+      const radius = () => 4;
+      let isDarkMode = false;
+      function getDotStrokeColor(fillColor = null){ 
+        if (!fillColor) return 'var(--muted-color)';
+        
+        // Résoudre les variables CSS en couleurs réelles
+        let resolvedColor = fillColor;
+        if (fillColor.startsWith('var(')) {
+          const tempEl = document.createElement('div');
+          tempEl.style.color = fillColor;
+          document.body.appendChild(tempEl);
+          resolvedColor = getComputedStyle(tempEl).color;
+          document.body.removeChild(tempEl);
+        }
+        
+        try {
+          const colorObj = d3.color(resolvedColor);
+          if (!colorObj) return 'var(--muted-color)';
+          
+          // En mode light: bordure plus claire, en mode dark: bordure plus sombre
+          return isDarkMode ? 
+            colorObj.darker(0.3).toString() : 
+            colorObj.brighter(0.8).toString();
+        } catch {
+          return 'var(--muted-color)';
+        }
+      }
+
+      // Data loading (real): banner visualization positions by category
+      async function fetchFirstAvailable(paths){
+        for (const p of paths){
+          try {
+            const res = await fetch(p, { cache: 'no-cache' });
+            if (res.ok){ return await res.text(); }
+          } catch (e) {}
+        }
+        throw new Error('Failed to load data from provided paths');
+      }
+
+      let data = [];
+      let categories = [];
+      let colorMode = 'group';
+
+      function renderLegend(innerWidth){ gLegend.remove(); }
+
+      function updateScales(data){
+        const isDark = document.documentElement.getAttribute('data-theme') === 'dark';
+        isDarkMode = !!isDark;
+        const axisColor = "var(--page-bg)";
+        const tickColor = "var(--page-bg)";
+        const gridColor = "var(--page-bg)";
+
+        width = container.clientWidth || 800; height = Math.max(260, Math.round(width/3)); svg.attr('width', width).attr('height', height);
+        const innerWidth = width - margin.left - margin.right; const innerHeight = height - margin.top - margin.bottom; gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+
+        const xExtent = d3.extent(data, d=>d.x);
+        const yExtent = d3.extent(data, d=>d.y);
+        x.domain([xExtent[0], xExtent[1]]).range([0, innerWidth]).nice();
+        y.domain([yExtent[0], yExtent[1]]).range([innerHeight, 0]).nice();
+
+        // Frameless: no grid, no axes
+        gGrid.selectAll('*').remove();
+        gAxes.selectAll('*').remove();
+
+        renderLegend(innerWidth);
+
+        return { innerWidth, innerHeight };
+      }
+
+      function refreshPalette(){
+        try {
+          const cats = categories && categories.length ? categories.length : 6;
+          if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+            const arr = window.ColorPalettes.getColors('categorical', cats) || [];
+            if (arr && arr.length) { color.range(arr); return; }
+          }
+          // fallback
+          color.range((d3.schemeTableau10 ? d3.schemeTableau10 : ['#4e79a7','#f28e2b','#e15759','#76b7b2','#59a14f','#edc948','#b07aa1','#ff9da7','#9c755f','#bab0ab']).slice(0, cats));
+        } catch {
+          const cats = categories && categories.length ? categories.length : 6;
+          color.range((d3.schemeTableau10 ? d3.schemeTableau10 : ['#4e79a7','#f28e2b','#e15759','#76b7b2','#59a14f','#edc948','#b07aa1','#ff9da7','#9c755f','#bab0ab']).slice(0, cats));
+        }
+        // Recolor existing marks/labels after palette changes
+        try { if (data && data.length) draw(); } catch {}
+      }
+
+      function draw(){
+        if (!data || !data.length) return;
+        const { innerWidth, innerHeight } = updateScales(data);
+        const fillFor = d => colorMode === 'group' ? color(d.group) : 'var(--primary-color)';
+
+        const dots = gDots.selectAll('circle.dot').data(data, (d,i)=>d.id || i);
+        dots.enter().append('circle').attr('class','dot')
+          .attr('cx', d=>x(d.x)).attr('cy', d=>y(d.y)).attr('r', radius())
+          .attr('fill', fillFor).attr('fill-opacity', 0.85)
+          .attr('stroke', d => getDotStrokeColor(fillFor(d))).attr('stroke-width', '0.75px')
+          .on('mouseenter', function(ev, d){
+            d3.select(this).style('stroke','var(--text-color)').style('stroke-width','1.5px').attr('fill-opacity', 1);
+            const swatch = `<svg width="10" height="10" viewBox="0 0 10 10" aria-hidden="true"><circle cx="5" cy="5" r="5" fill="${fillFor(d)}" /></svg>`;
+            tipInner.innerHTML = `
+              <div><strong>${d.label || 'Item'}</strong></div>
+              <div style="display:flex;align-items:center;gap:6px;">${swatch}<span>${d.group}</span></div>
+              <div style="display:flex;align-items:center;gap:6px;white-space:nowrap;"><strong>x</strong><span style="margin-left:auto;text-align:right;">${d.x.toFixed(2)}</span></div>
+              <div style="display:flex;align-items:center;gap:6px;white-space:nowrap;"><strong>y</strong><span style="margin-left:auto;text-align:right;">${d.y.toFixed(2)}</span></div>`;
+            tip.style.opacity = '1';
+          })
+          .on('mousemove', function(ev){ const [mx, my] = d3.pointer(ev, container); const ox=12, oy=12; tip.style.transform = `translate(${Math.round(mx+ox)}px, ${Math.round(my+oy)}px)`; })
+          .on('mouseleave', function(ev, d){ tip.style.opacity='0'; tip.style.transform='translate(-9999px, -9999px)'; d3.select(this).style('stroke', getDotStrokeColor(fillFor(d))).style('stroke-width','0.75px').attr('fill-opacity', 0.85); })
+          .merge(dots)
+          .transition().duration(180)
+          .attr('cx', d=>x(d.x)).attr('cy', d=>y(d.y)).attr('r', radius())
+          .attr('fill', fillFor).attr('fill-opacity', 0.85)
+          .attr('stroke', d => getDotStrokeColor(fillFor(d))).attr('stroke-width','0.75px');
+        dots.exit().remove();
+
+        // Compute centroids per category
+        const centroids = Array.from(
+          d3.rollup(
+            data,
+            (v) => ({
+              category: v[0] ? v[0].group : 'Unknown',
+              x: d3.mean(v, (d) => d.x),
+              y: d3.mean(v, (d) => d.y),
+              count: v.length
+            }),
+            (d) => d.group
+          ).values()
+        );
+
+        // Map to pixel space nodes for collision-avoiding label placement
+        const nodes = centroids.map((c) => ({
+          category: c.category,
+          count: c.count,
+          targetX: x(c.x),
+          targetY: y(c.y),
+          x: x(c.x),
+          y: y(c.y),
+          width: Math.max(18, (String(c.category || '').length || 6) * 11),
+          height: 16
+        }));
+
+        if (nodes.length > 1) {
+          const sim = d3.forceSimulation(nodes)
+            .force('x', d3.forceX((d) => d.targetX).strength(0.9))
+            .force('y', d3.forceY((d) => d.targetY).strength(0.9))
+            .force('collide', d3.forceCollide((d) => Math.hypot(d.width/2, d.height/2) + 15))
+            .stop();
+          for (let i = 0; i < 650; i++) sim.tick();
+          const maxOffset = 45;
+          nodes.forEach((n) => {
+            const dx = n.x - n.targetX, dy = n.y - n.targetY; const dist = Math.hypot(dx, dy);
+            if (dist > maxOffset && dist > 0) { const s = maxOffset / dist; n.x = n.targetX + dx * s; n.y = n.targetY + dy * s; }
+          });
+        }
+
+        const labels = gCentroids.selectAll('g.centroid').data(nodes, d => d.category || 'Unknown');
+        const enter = labels.enter().append('g').attr('class','centroid').attr('pointer-events','none');
+        enter.append('text').attr('class','label-bg').attr('text-anchor','middle').attr('dominant-baseline','middle');
+        enter.append('text').attr('class','label-fg').attr('text-anchor','middle').attr('dominant-baseline','middle');
+        const merged = enter.merge(labels);
+        merged
+          .attr('transform', d => `translate(${Math.round(d.x)}, ${Math.round(d.y)})`)
+          .each(function(d){
+            const base = color(d.category || 'Unknown') || 'var(--text-color)';
+            const bg = getComputedStyle(document.documentElement).getPropertyValue('--page-bg').trim() || '#fff';
+            const bgNode = this.querySelector('text.label-bg');
+            const fgNode = this.querySelector('text.label-fg');
+            if (bgNode) {
+              bgNode.textContent = d.category;
+              bgNode.style.setProperty('fill', "var(--page-bg)", 'important');
+              bgNode.style.setProperty('stroke', "var(--page-bg)");
+              bgNode.style.setProperty('stroke-width', '8px');
+              bgNode.style.setProperty('paint-order', 'stroke fill');
+              bgNode.style.setProperty('font-weight','800');
+              bgNode.style.setProperty('font-size','16px');
+            }
+            if (fgNode) {
+              fgNode.textContent = d.category;
+              fgNode.style.setProperty('fill', base, 'important');
+              fgNode.style.setProperty('font-weight','800');
+              fgNode.style.setProperty('font-size','16px');
+            }
+          });
+        labels.exit().remove();
+      }
+
+      // Initial load
+      refreshPalette();
+      document.addEventListener('palettes:updated', refreshPalette);
+
+      (async () => {
+        try {
+          const csvText = await fetchFirstAvailable([
+            '/data/banner_visualisation_data.csv',
+            './assets/data/banner_visualisation_data.csv',
+            '../assets/data/banner_visualisation_data.csv',
+            '/data/banner_visualisation_data.csv'
+          ]);
+          const rows = d3.csvParse(csvText);
+          data = rows.map((r, i) => ({
+            id: +r.original_id ?? i,
+            x: +r.x_position,
+            y: +r.y_position,
+            group: r.category || 'Unknown',
+            label: r.subset || r.category || `Item ${i+1}`
+          })).filter(d => Number.isFinite(d.x) && Number.isFinite(d.y));
+          categories = Array.from(new Set(data.map(d=>d.group)));
+          color.domain(categories);
+          draw();
+        } catch (e) {
+          const pre = document.createElement('pre'); pre.style.color = 'crimson'; pre.textContent = 'Failed to load scatter data.'; container.appendChild(pre);
+        }
+      })();
+
+      const rerender = () => { draw(); };
+      if (window.ResizeObserver) { const ro = new ResizeObserver(()=>rerender()); ro.observe(container); } else { window.addEventListener('resize', rerender); }
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
+
+
diff --git a/app/src/content/embeds/demo/color-picker.html b/app/src/content/embeds/demo/color-picker.html
new file mode 100644
index 0000000000000000000000000000000000000000..3cd1eaf960868ff23534f5c6daa62484ad647947
--- /dev/null
+++ b/app/src/content/embeds/demo/color-picker.html
@@ -0,0 +1,226 @@
+<div class="color-picker" style="width:100%; margin: 10px 0;">
+  <style>
+    .color-picker .picker__stack { display:flex; flex-direction:column; gap:12px; }
+    .color-picker .current-card { display:grid; grid-template-columns: 30% 70%; align-items: center; gap:14px; padding:14px 32px 14px 16px; border:1px solid var(--border-color); background: var(--surface-bg); border-radius: 12px; }
+    .color-picker .current-left { display:flex; flex-direction: column; gap:8px; min-width: 0; }
+    .color-picker .current-right { display:flex; flex-direction: column; gap:8px; padding-left: 14px; border-left: 1px solid var(--border-color); }
+    .color-picker .current-main { display:flex; align-items:center; gap:12px; min-width: 0; }
+    .color-picker .current-swatch { width: 32px; height: 32px; border-radius: 8px; border: 1px solid var(--border-color); }
+    .color-picker .current-text { display:flex; flex-direction: column; line-height: 1.2; min-width: 0; }
+    .color-picker .current-name { font-size: 14px; font-weight: 800; color: var(--text-color); white-space: nowrap; overflow: hidden; text-overflow: ellipsis; max-width: clamp(140px, 28vw, 260px); }
+    .color-picker .current-hex, .color-picker .current-extra { font-size: 11px; color: var(--muted-color); letter-spacing: .02em; white-space: nowrap; overflow: hidden; text-overflow: ellipsis; max-width: clamp(140px, 28vw, 260px); }
+    /* theme preview styles removed */
+    .color-picker .picker__label { font-weight:700; font-size: 12px; color: var(--muted-color); text-transform: uppercase; letter-spacing: .02em; }
+    .color-picker .hue-slider { position:relative; height:16px; border-radius:10px; border:1px solid var(--border-color); background: linear-gradient(to right, #f00 0%, #ff0 17%, #0f0 33%, #0ff 50%, #00f 67%, #f0f 83%, #f00 100%); cursor: ew-resize; touch-action: none; flex: 1 1 auto; min-width: 200px; }
+    .color-picker .hue-knob { position:absolute; top:50%; left:93.6%; width:14px; height:14px; border-radius:50%; border:2px solid #fff; transform:translate(-50%, -50%); background: var(--surface-bg); z-index: 2; box-shadow: 0 0 0 1px rgba(0,0,0,.05); }
+    .color-picker .hue-slider:focus-visible { outline: 2px solid var(--primary-color); outline-offset: 2px; }
+    .color-picker .hue-value { font-variant-numeric: tabular-nums; color: var(--muted-color); font-size: 12px; }
+    @media (max-width: 720px) { .color-picker .current-card { grid-template-columns: 1fr; } .color-picker .current-right { padding-left: 0; border-left: none; } }
+  </style>
+  <div class="picker__stack">
+    <div class="current-card">
+      <div class="current-left">
+        <div class="current-main">
+          <div class="current-swatch" aria-label="Current color" title="Current color"></div>
+          <div class="current-text">
+            <div class="current-name">—</div>
+            <div class="current-hex">—</div>
+            <div class="current-extra current-lch">—</div>
+            <div class="current-extra current-rgb">—</div>
+          </div>
+        </div>
+      </div>
+      <div class="current-right">
+        <div class="picker__label">Hue</div>
+        <div class="hue-slider" role="slider" aria-label="Hue" aria-valuemin="0" aria-valuemax="360" aria-valuenow="337" tabindex="0">
+          <div class="hue-knob"></div>
+        </div>
+        <div class="hue-value">337°</div>
+      </div>
+    </div>
+  </div>
+</div>
+<script>
+  (() => {
+    // Ensure chroma.js is loaded once
+    const ensureChroma = (next) => {
+      if (window.chroma) return next();
+      const loadScript = (id, src, onload, onerror) => {
+        let s = document.getElementById(id);
+        if (s) { return onload && onload(); }
+        s = document.createElement('script');
+        s.id = id; s.src = src; s.async = true;
+        if (onload) s.addEventListener('load', onload, { once: true });
+        if (onerror) s.addEventListener('error', onerror, { once: true });
+        document.head.appendChild(s);
+      };
+      loadScript('chroma-cdn', 'https://unpkg.com/chroma-js@2.4.2/dist/chroma.min.js', next, () => {
+        loadScript('chroma-cdn-fallback', 'https://cdnjs.cloudflare.com/ajax/libs/chroma-js/2.4.2/chroma.min.js', next);
+      });
+    };
+
+    // Minimal embedded color-name list (same as palettes)
+    const COLOR_NAMES = [{"name":"Candy Apple Red","hex":"#ff0800"},{"name":"Boiling Magma","hex":"#ff3300"},{"name":"Aerospace Orange","hex":"#ff4f00"},{"name":"Burtuqali Orange","hex":"#ff6700"},{"name":"American Orange","hex":"#ff8b00"},{"name":"Cheese","hex":"#ffa600"},{"name":"Amber","hex":"#ffbf00"},{"name":"Demonic Yellow","hex":"#ffe700"},{"name":"Bat-Signal","hex":"#feff00"},{"name":"Bitter Lime","hex":"#cfff00"},{"name":"Electric Lime","hex":"#ccff00"},{"name":"Bright Yellow Green","hex":"#9dff00"},{"name":"Lasting Lime","hex":"#88ff00"},{"name":"Bright Green","hex":"#66ff00"},{"name":"Chlorophyll Green","hex":"#4aff00"},{"name":"Green Screen","hex":"#22ff00"},{"name":"Electric Pickle","hex":"#00ff04"},{"name":"Acid","hex":"#00ff22"},{"name":"Lucent Lime","hex":"#00ff33"},{"name":"Cathode Green","hex":"#00ff55"},{"name":"Booger Buster","hex":"#00ff77"},{"name":"Green Gas","hex":"#00ff99"},{"name":"Enthusiasm","hex":"#00ffaa"},{"name":"Ice Ice Baby","hex":"#00ffdd"},{"name":"Master Sword Blue","hex":"#00ffee"},{"name":"Agressive Aqua","hex":"#00fbff"},{"name":"Vivid Sky Blue","hex":"#00ccff"},{"name":"Capri","hex":"#00bfff"},{"name":"Sky of Magritte","hex":"#0099ff"},{"name":"Azure","hex":"#007fff"},{"name":"Blue Ribbon","hex":"#0066ff"},{"name":"Blinking Blue","hex":"#0033ff"},{"name":"Icelandic Water","hex":"#0011ff"},{"name":"Blue","hex":"#0000ff"},{"name":"Blue Pencil","hex":"#2200ff"},{"name":"Electric Ultramarine","hex":"#3f00ff"},{"name":"Aladdin's Feather","hex":"#5500ff"},{"name":"Purple Climax","hex":"#8800ff"},{"name":"Amethyst Ganzstar","hex":"#8f00ff"},{"name":"Electric Purple","hex":"#bf00ff"},{"name":"Phlox","hex":"#df00ff"},{"name":"Brusque Pink","hex":"#ee00ff"},{"name":"Bright Magenta","hex":"#ff08e8"},{"name":"Big bang Pink","hex":"#ff00bb"},{"name":"Mean Girls Lipstick","hex":"#ff00ae"},{"name":"Pink","hex":"#ff0099"},{"name":"Hot Flamingoes","hex":"#ff005d"},{"name":"Blazing Dragonfruit","hex":"#ff0054"},{"name":"Carmine Red","hex":"#ff0038"},{"name":"Bright Red","hex":"#ff000d"}];
+    if (!window.__colorNames) window.__colorNames = COLOR_NAMES;
+
+    // Shared event bus so multiple instances stay in sync
+    if (!window.__colorPickerBus) {
+      window.__colorPickerBus = (() => {
+        let hue = 337; // shared initial hue
+        let adjusting = false;
+        const listeners = new Set();
+        return {
+          get: () => ({ hue, adjusting }),
+          publish: (sourceId, nextHue, isAdjusting) => {
+            hue = ((nextHue % 360) + 360) % 360;
+            adjusting = !!isAdjusting;
+            listeners.forEach((fn) => { try { fn({ sourceId, hue, adjusting }); } catch {} });
+          },
+          subscribe: (fn) => { listeners.add(fn); return () => listeners.delete(fn); }
+        };
+      })();
+    }
+
+    const bootstrap = () => {
+      const mount = document.currentScript ? document.currentScript.previousElementSibling : null;
+      const root = mount && mount.closest('.color-picker') ? mount.closest('.color-picker') : document.querySelector('.color-picker');
+      if (!root || root.dataset.mounted) return; root.dataset.mounted = 'true';
+
+      const slider = root.querySelector('.hue-slider');
+      const knob = root.querySelector('.hue-knob');
+      const hueValue = root.querySelector('.hue-value');
+      const currentSwatch = root.querySelector('.current-swatch');
+      const currentName = root.querySelector('.current-name');
+      const currentHex = root.querySelector('.current-hex');
+      const currentLch = root.querySelector('.current-lch');
+      const currentRgb = root.querySelector('.current-rgb');
+
+      const bus = window.__colorPickerBus;
+      const instanceId = Math.random().toString(36).slice(2);
+
+      const getKnobRadius = () => {
+        try { const w = knob ? knob.getBoundingClientRect().width : 0; return w ? w / 2 : 8; } catch { return 8; }
+      };
+
+      const getName = (hex) => {
+        const list = (window.__colorNames && window.__colorNames.length) ? window.__colorNames : COLOR_NAMES;
+        if (list && window.chroma) {
+          let bestName = null; let best = Infinity;
+          for (let i = 0; i < list.length; i++) {
+            const item = list[i];
+            const d = (chroma.deltaE ? chroma.deltaE(hex, item.hex) : chroma.distance(hex, item.hex, 'lab'));
+            if (d < best) { best = d; bestName = item.name; }
+          }
+          if (bestName) return bestName;
+        }
+        const hh = chroma(hex).get('hsl.h') || 0;
+        const labels = ['Red','Orange','Yellow','Lime','Green','Cyan','Blue','Indigo','Violet','Magenta'];
+        const idx = Math.round(((hh % 360) / 360) * (labels.length - 1));
+        return labels[idx];
+      };
+
+      const updateUI = (h, adjusting) => {
+        const rect = slider.getBoundingClientRect();
+        const r = Math.min(getKnobRadius(), Math.max(0, rect.width / 2 - 1));
+        const t = Math.max(0, Math.min(1, (h / 360)));
+        const leftPx = r + t * Math.max(0, (rect.width - 2 * r));
+        if (knob) knob.style.left = (leftPx / rect.width * 100) + '%';
+        if (hueValue) hueValue.textContent = `${Math.round(h)}°`;
+        if (slider) slider.setAttribute('aria-valuenow', String(Math.round(h)));
+        // Use LCH for consistent chroma across hues
+        const L = 70; // lightness
+        const C = 60; // chroma kept within sRGB-friendly range
+        const base = chroma.lch(L, C, h);
+        const baseHex = base.hex();
+        if (currentSwatch) currentSwatch.style.background = baseHex;
+        if (currentName) currentName.textContent = getName(baseHex.toUpperCase());
+        if (currentHex) currentHex.textContent = baseHex.toUpperCase();
+        if (currentLch) {
+          const lc = base.lch();
+          const L = Math.round((lc[0] || 0));
+          const C = Math.round((lc[1] || 0));
+          const H = Math.round(((lc[2] || 0) % 360 + 360) % 360);
+          currentLch.textContent = `LCH ${L}, ${C}, ${H}°`;
+        }
+        if (currentRgb) {
+          const rgb = base.rgb().map(v => Math.round(v));
+          currentRgb.textContent = `RGB ${rgb[0]}, ${rgb[1]}, ${rgb[2]}`;
+        }
+        // Apply to theme (always, to reflect the selection)
+        const hoverL = Math.max(0, Math.min(100, L - 8));
+        const hoverHex = chroma.lch(hoverL, C, h).hex();
+        const rootEl = document.documentElement;
+        rootEl.style.setProperty('--primary-color', baseHex);
+        rootEl.style.setProperty('--primary-color-hover', hoverHex);
+      };
+
+      const getHueFromEvent = (ev) => {
+        const rect = slider.getBoundingClientRect();
+        const clientX = ev.touches ? ev.touches[0].clientX : ev.clientX;
+        const x = clientX - rect.left;
+        const r = Math.min(getKnobRadius(), Math.max(0, rect.width / 2 - 1));
+        const effX = Math.max(r, Math.min(rect.width - r, x));
+        const denom = Math.max(1, rect.width - 2 * r);
+        const t = (effX - r) / denom;
+        return t * 360;
+      };
+
+      // Subscribe to bus to sync multiple instances
+      const unsubscribe = bus.subscribe(({ sourceId, hue, adjusting }) => {
+        if (sourceId === instanceId) return; // avoid feedback
+        updateUI(hue, adjusting);
+      });
+
+      // Init from theme color if available
+      try {
+        const cssPrimary = getComputedStyle(document.documentElement).getPropertyValue('--primary-color').trim();
+        if (cssPrimary) {
+          const initH = chroma(cssPrimary).get('hsl.h') || 0;
+          updateUI(initH, false);
+          bus.publish(instanceId, initH, false);
+        } else {
+          const { hue: sharedHue } = bus.get();
+          updateUI(sharedHue, false);
+        }
+      } catch {
+        const { hue: sharedHue } = bus.get();
+        updateUI(sharedHue, false);
+      }
+
+      const onDown = (ev) => {
+        ev.preventDefault();
+        const h = getHueFromEvent(ev);
+        updateUI(h, true);
+        bus.publish(instanceId, h, true);
+        const move = (e) => { e.preventDefault && e.preventDefault(); const hh = getHueFromEvent(e); updateUI(hh, true); bus.publish(instanceId, hh, true); };
+        const up = () => { bus.publish(instanceId, getHueFromEvent(ev), false); window.removeEventListener('mousemove', move); window.removeEventListener('touchmove', move); window.removeEventListener('mouseup', up); window.removeEventListener('touchend', up); };
+        window.addEventListener('mousemove', move, { passive: false });
+        window.addEventListener('touchmove', move, { passive: false });
+        window.addEventListener('mouseup', up, { once: true });
+        window.addEventListener('touchend', up, { once: true });
+      };
+
+      if (slider) {
+        slider.addEventListener('mousedown', onDown);
+        slider.addEventListener('touchstart', onDown, { passive: false });
+        // Minimal keyboard support (←/→, Shift for larger steps)
+        slider.addEventListener('keydown', (e) => {
+          const step = e.shiftKey ? 10 : 2;
+          if (e.key === 'ArrowLeft') { e.preventDefault(); const { hue } = bus.get(); const h = hue - step; updateUI(h, true); bus.publish(instanceId, h, true); bus.publish(instanceId, h, false); }
+          if (e.key === 'ArrowRight') { e.preventDefault(); const { hue } = bus.get(); const h = hue + step; updateUI(h, true); bus.publish(instanceId, h, true); bus.publish(instanceId, h, false); }
+        });
+      }
+
+      // Clean up on detach (best-effort)
+      const ro = new MutationObserver(() => {
+        if (!document.body.contains(root)) { unsubscribe && unsubscribe(); ro.disconnect(); }
+      });
+      ro.observe(document.body, { childList: true, subtree: true });
+    };
+
+    if (document.readyState === 'loading') document.addEventListener('DOMContentLoaded', () => ensureChroma(bootstrap), { once: true });
+    else ensureChroma(bootstrap);
+  })();
+</script>
+
+
diff --git a/app/src/content/embeds/demo/content-structure.html b/app/src/content/embeds/demo/content-structure.html
new file mode 100644
index 0000000000000000000000000000000000000000..c388ebb897e2528321df178dd9bb888fbe2ac055
--- /dev/null
+++ b/app/src/content/embeds/demo/content-structure.html
@@ -0,0 +1,161 @@
+<div class="cs" role="img" aria-label="Content folder structure: MDX, assets, embeds">
+  <div class="cs__header">
+    <svg class="cs__folder" viewBox="0 0 24 24" preserveAspectRatio="xMidYMid meet" aria-hidden="true">
+      <path d="M4 7h4.5l1.8 2H20"/>
+      <rect x="4" y="9" width="16" height="10" rx="2" ry="2"/>
+    </svg>
+    <span class="cs__path">/app/src/content</span>
+  </div>
+
+  <div class="cs__grid">
+    <div class="cs__box">
+      <div class="cs__box-head">
+        <svg class="cs__icon" viewBox="0 0 24 24" aria-hidden="true">
+          <rect x="3" y="3" width="14" height="18" rx="2" ry="2"/>
+          <path d="M14 3l4 4h-4z"/>
+          <path d="M7 11l-2 2l2 2"/>
+          <path d="M13 11l2 2l-2 2"/>
+          <path d="M10 11v4"/>
+        </svg>
+        <span class="cs__label">MDX</span>
+      </div>
+      <div class="cs__items">
+        <div class="cs__item">article.mdx</div>
+        <div class="cs__item"><a href="#chapters">chapters/</a>*.mdx</div>
+      </div>
+    </div>
+
+    <div class="cs__box">
+      <div class="cs__box-head">
+        <svg class="cs__icon" viewBox="0 0 24 24" aria-hidden="true">
+          <path d="M6 5h10a2 2 0 0 1 2 2v12c-2-.9-4-1.6-6-1.6S8 18.1 6 19V7a2 2 0 0 1 2-2z"/>
+          <path d="M6 9h12"/>
+        </svg>
+        <span class="cs__label">Bib</span>
+      </div>
+      <div class="cs__items">
+        <div class="cs__item">bibliography.bib</div>
+      </div>
+    </div>
+    <div class="cs__box">
+      <div class="cs__box-head">
+        <svg class="cs__icon" viewBox="0 0 24 24" aria-hidden="true">
+          <rect x="3" y="5" width="18" height="14" rx="2" ry="2"/>
+          <circle cx="8" cy="10" r="1.4"/>
+          <path d="M6 16l4-3 2 2 3-2-1 3H6z"/>
+        </svg>
+        <span class="cs__label">assets/</span>
+      </div>
+      <div class="cs__items">
+        <div class="cs__item">audio/</div>
+        <div class="cs__item">image/</div>
+        <div class="cs__item">data/</div>
+      </div>
+    </div>
+
+    <div class="cs__box">
+      <div class="cs__box-head">
+        <svg class="cs__icon" viewBox="0 0 24 24" aria-hidden="true">
+          <path d="M9 16l-4-4l4-4"/>
+          <path d="M15 16l4-4l-4-4"/>
+        </svg>
+        <span class="cs__label">embeds/</span>
+      </div>
+      <div class="cs__items">
+        <div class="cs__item"><a href="#htmlembed">*.html</a></div>
+      </div>
+    </div>
+    
+  </div>
+</div>
+
+<style>
+  .cs {
+    width: 100%;
+    box-sizing: border-box;
+    border: 1px solid var(--border-color);
+    border-radius: 12px;
+    background: var(--surface-bg);
+    color: var(--text-color);
+    padding: 10px 12px 12px;
+    margin-bottom: var(--block-spacing-y);
+  }
+  .cs__header {
+    display: flex;
+    align-items: center;
+    gap: 8px;
+    margin: 2px 0 10px 0;
+  }
+  .cs__folder {
+    width: 20px;
+    height: auto;
+    display: block;
+    flex: 0 0 auto;
+    stroke: var(--text-color);
+    fill: none;
+    stroke-width: 1.5;
+    stroke-linecap: round;
+    stroke-linejoin: round;
+    vector-effect: non-scaling-stroke;
+    shape-rendering: geometricPrecision;
+  }
+  .cs__path { font-weight: 600; font-size: 14px; }
+
+  .cs__grid {
+    display: grid;
+    grid-template-columns: repeat(4, minmax(0, 1fr));
+    gap: 12px;
+  }
+
+  .cs__box {
+    border: 1px solid var(--border-color);
+    border-radius: 10px;
+    background: var(--surface-bg);
+    padding: 10px 12px;
+    display: flex;
+    flex-direction: column;
+    min-height: 120px;
+  }
+  .cs__box-head {
+    display: flex;
+    align-items: center;
+    gap: 8px;
+    margin-bottom: 8px;
+  }
+  .cs__icon {
+    width: 18px;
+    height: 18px;
+    display: block;
+    stroke: var(--text-color);
+    fill: none;
+    stroke-width: 1.5;
+    stroke-linecap: round;
+    stroke-linejoin: round;
+    vector-effect: non-scaling-stroke;
+    shape-rendering: geometricPrecision;
+  }
+  .cs__label {
+    font-weight: 700;
+    font-size: 13px;
+  }
+  .cs__items {
+    display: grid;
+    gap: 4px;
+  }
+  .cs__item {
+    font-size: 12px;
+    color: var(--muted-color);
+  }
+
+  @media (max-width: 1180px) {
+    .cs__grid {
+      grid-template-columns: repeat(2, minmax(0, 1fr));
+    }
+  }
+  @media (max-width: 620px) {
+    .cs__grid {
+      grid-template-columns: 1fr;
+    }
+  }
+</style>
+
diff --git a/app/src/content/embeds/demo/palettes.html b/app/src/content/embeds/demo/palettes.html
new file mode 100644
index 0000000000000000000000000000000000000000..31850e2706bdb187409061c917a80858d0117277
--- /dev/null
+++ b/app/src/content/embeds/demo/palettes.html
@@ -0,0 +1,219 @@
+<div class="palettes" style="width:100%; margin: 10px 0;">
+  <style>
+    .palettes { box-sizing: border-box; overflow-x: hidden; }
+    .palettes .palettes__grid { display: grid; grid-template-columns: 1fr; gap: 12px; max-width: 100%; }
+    .palettes .palette-card { position: relative; display: grid; grid-template-columns: auto 1fr minmax(0, 220px); align-items: stretch; gap: 12px; border: 1px solid var(--border-color); border-radius: 10px; background: var(--surface-bg); padding: 12px; transition: box-shadow .18s ease, transform .18s ease, border-color .18s ease; }
+    /* removed circular badge */
+    .palettes .palette-card__swatches { display: grid; grid-template-columns: repeat(6, minmax(0, 1fr)); grid-auto-rows: 1fr; gap: 2px; margin: 0; min-height: 20px; }
+    .palettes .palette-card__swatches .sw { width: 100%; min-width: 0; min-height: 0; border-radius: 0; border: 1px solid var(--border-color); }
+    .palettes .palette-card__swatches .sw:first-child { border-top-left-radius: 8px; border-bottom-left-radius: 8px; }
+    .palettes .palette-card__swatches .sw:last-child { border-top-right-radius: 8px; border-bottom-right-radius: 8px; }
+    .palettes .palette-card__content { display: flex; flex-direction: row; align-items: center; justify-content: center; gap: 6px; min-width: 0; padding-right: 0; }
+    .palettes .palette-card__content__info { display: flex; flex-direction: column;  }
+    .palettes .palette-card__title { text-align: left; font-weight: 800; font-size: 15px; }
+    .palettes .palette-card__desc { text-align: left; color: var(--muted-color); line-height: 1.5; font-size: 12px; }
+    .palettes .palette-card__actions { display: flex; align-items: center; justify-content: flex-start; justify-self: start; align-self: stretch; }
+    /* .palettes .copy-btn { margin: 0; padding: 0 10px; height: 100%; border-radius: 8px; } */
+    /* .palettes .copy-btn:hover { background: var(--primary-color); color: var(--on-primary)!important; border-color: transparent; }
+    .palettes .copy-btn:focus-visible { outline: 2px solid var(--primary-color); outline-offset: 2px; } */
+    .palettes .copy-btn svg { width: 18px; height: 18px; fill: currentColor; display: block; }
+    /* Simulation UI */
+    .palettes .palettes__select { width: 100%; max-width: 100%; border: 1px solid var(--border-color); background: var(--surface-bg); color: var(--text-color); padding: 8px 10px; border-radius: 8px; }
+    .palettes .sr-only { position: absolute; width: 1px; height: 1px; padding: 0; margin: -1px; overflow: hidden; clip: rect(0, 0, 1px, 1px); white-space: nowrap; border: 0; }
+    .palettes .palettes__controls { display: flex; flex-wrap: wrap; gap: 16px; align-items: center; margin: 8px 0 14px; }
+    .palettes .palettes__field { display: flex; flex-direction: column; gap: 6px; min-width: 0; flex: 1 1 280px; max-width: 100%; }
+    .palettes .palettes__label { font-size: 12px; color: var(--muted-color); font-weight: 800; }
+    .palettes .palettes__label-row { display: flex; align-items: center; justify-content: space-between; gap: 10px; }
+    .palettes .ghost-badge { font-size: 11px; padding: 1px 6px; border-radius: 999px; border: 1px solid var(--border-color); color: var(--muted-color); background: transparent; font-variant-numeric: tabular-nums; }
+    .palettes .palettes__count { display: flex; align-items: center; gap: 8px; max-width: 100%; }
+    .palettes .palettes__count input[type="range"] { width: 100%; }
+    .palettes .palettes__count output { min-width: 28px; text-align: center; font-variant-numeric: tabular-nums; font-size: 12px; color: var(--muted-color); }
+    /* Slider styling */
+    .palettes input[type="range"] { -webkit-appearance: none; appearance: none; height: 24px; background: transparent; cursor: pointer; accent-color: var(--primary-color); }
+    .palettes input[type="range"]:focus { outline: none; }
+    /* WebKit */
+    .palettes input[type="range"]::-webkit-slider-runnable-track { height: 6px; background: var(--border-color); border-radius: 999px; }
+    .palettes input[type="range"]::-webkit-slider-thumb { -webkit-appearance: none; appearance: none; margin-top: -6px; width: 18px; height: 18px; background: var(--primary-color); border: 2px solid var(--surface-bg); border-radius: 50%; }
+    /* Firefox */
+    .palettes input[type="range"]::-moz-range-track { height: 6px; background: var(--border-color); border: none; border-radius: 999px; }
+    .palettes input[type="range"]::-moz-range-progress { height: 6px; background: var(--primary-color); border-radius: 999px; }
+    .palettes input[type="range"]::-moz-range-thumb { width: 18px; height: 18px; background: var(--primary-color); border: 2px solid var(--surface-bg); border-radius: 50%; }
+    /* Page-wide color vision simulation classes */
+    html.cb-grayscale, body.cb-grayscale { filter: grayscale(1) !important; }
+    html.cb-protanopia, body.cb-protanopia { filter: url(#cb-protanopia) !important; }
+    html.cb-deuteranopia, body.cb-deuteranopia { filter: url(#cb-deuteranopia) !important; }
+    html.cb-tritanopia, body.cb-tritanopia { filter: url(#cb-tritanopia) !important; }
+    html.cb-achromatopsia, body.cb-achromatopsia { filter: url(#cb-achromatopsia) !important; }
+    @media (max-width: 640px) {
+      .palettes .palette-card { grid-template-columns: 1fr; align-items: stretch; gap: 10px; }
+      .palettes .palette-card__swatches { grid-template-columns: repeat(6, minmax(0, 1fr));  }
+      .palettes .palette-card__content { border-right: none; padding-right: 0; }
+      .palettes .palette-card__actions { justify-self: start; }
+      
+    }
+  </style>
+  <div class="palettes__controls">
+    <div class="palettes__field">
+      <label class="palettes__label" for="cb-select">Color vision simulation</label>
+      <select id="cb-select" class="palettes__select">
+        <option value="none">Normal color vision — typical for most people</option>
+        <option value="achromatopsia">Achromatopsia — no color at all</option>
+        <option value="protanopia">Protanopia — reduced/absent reds</option>
+        <option value="deuteranopia">Deuteranopia — reduced/absent greens</option>
+        <option value="tritanopia">Tritanopia — reduced/absent blues</option>
+      </select>
+    </div>
+    <div class="palettes__field">
+      <div class="palettes__label-row">
+        <label class="palettes__label" for="color-count">Number of colors</label>
+        <output id="color-count-out" for="color-count" class="ghost-badge">8</output>
+      </div>
+      <div class="palettes__count">
+        <input id="color-count" type="range" min="6" max="10" step="1" value="8" aria-label="Number of colors" />
+      </div>
+    </div>
+  </div>
+  <div class="palettes__grid"></div>
+  <div class="palettes__simu" role="group" aria-labelledby="cb-sim-title">
+    <!-- Hidden SVG filters used by the page-wide simulation classes -->
+    <svg aria-hidden="true" focusable="false" width="0" height="0" style="position:absolute; left:-9999px; overflow:hidden;">
+      <defs>
+        <!-- Matrices from common color vision deficiency simulations -->
+        <filter id="cb-protanopia">
+          <feColorMatrix type="matrix" values="0.567 0.433 0     0 0  0.558 0.442 0     0 0  0      0.242 0.758 0 0  0 0 0 1 0"/>
+        </filter>
+        <filter id="cb-deuteranopia">
+          <feColorMatrix type="matrix" values="0.625 0.375 0     0 0  0.7   0.3   0     0 0  0      0.3   0.7   0 0  0 0 0 1 0"/>
+        </filter>
+        <filter id="cb-tritanopia">
+          <feColorMatrix type="matrix" values="0.95  0.05  0     0 0  0     0.433 0.567 0 0  0     0.475 0.525 0 0  0 0 0 1 0"/>
+        </filter>
+        <filter id="cb-achromatopsia">
+          <feColorMatrix type="matrix" values="0.299 0.587 0.114 0 0  0.299 0.587 0.114 0 0  0.299 0.587 0.114 0 0  0 0 0 1 0"/>
+        </filter>
+      </defs>
+    </svg>
+  </div>
+</div>
+<script>
+  (() => {
+    const cards = [
+      { key: 'categorical', title: 'Categorical', desc: 'For <strong>non‑numeric categories</strong>; <strong>visually distinct</strong> colors. The more you have the more likely they are to look similar.' },
+      { key: 'sequential', title: 'Sequential', desc: 'For <strong>numeric scales</strong>; gradient from <strong>dark to light</strong>. Ideal for <strong>heatmaps</strong>.' },
+      { key: 'diverging', title: 'Diverging', desc: 'Opposing extremes via <strong>base → white → complement</strong>; smooth contrast around a neutral midpoint.' }
+    ];
+
+    const getPaletteColors = (key, count) => {
+      const total = Number(count) || 6;
+      if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+        return window.ColorPalettes.getColors(key, total) || [];
+      }
+      return [];
+    };
+
+    const render = () => {
+      const mount = document.currentScript ? document.currentScript.previousElementSibling : null;
+      const root = mount && mount.closest('.palettes') ? mount.closest('.palettes') : document.querySelector('.palettes');
+      if (!root) return;
+      const grid = root.querySelector('.palettes__grid');
+      if (!grid) return;
+      const input = document.getElementById('color-count');
+      const total = input ? Number(input.value) || 6 : 6;
+      const html = cards.map((c) => {
+        const colors = getPaletteColors(c.key, total);
+        const swatches = colors.map(col => `<div class="sw" style="background:${col}"></div>`).join('');
+        return `
+          <div class="palette-card" data-colors="${colors.join(',')}">
+            <div class="palette-card__content">
+              <div class="palette-card__content__info">
+                <div class="palette-card__title">${c.title}</div>
+                <div class="palette-card__desc">${c.desc}</div>
+              </div>
+              <button class="copy-btn button--ghost" type="button" aria-label="Copy palette">
+                <svg viewBox="0 0 24 24" aria-hidden="true" focusable="false"><path d="M16 1H4c-1.1 0-2 .9-2 2v12h2V3h12V1zm3 4H8c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h11c1.1 0 2-.9 2-2V7c0-1.1-.9-2-2-2zm0 16H8V7h11v14z"/></svg>
+              </button>
+            </div>
+            <div class="palette-card__actions"></div>
+            <div class="palette-card__swatches" style="grid-template-columns: repeat(${colors.length}, minmax(0, 1fr));">${swatches}</div>
+          </div>
+        `;
+      }).join('');
+      grid.innerHTML = html;
+    };
+
+    const MODE_TO_CLASS = { protanopia: 'cb-protanopia', deuteranopia: 'cb-deuteranopia', tritanopia: 'cb-tritanopia', achromatopsia: 'cb-achromatopsia' };
+    const CLEAR_CLASSES = Object.values(MODE_TO_CLASS);
+    const clearCbClasses = () => {
+      const rootEl = document.documentElement;
+      CLEAR_CLASSES.forEach(cls => rootEl.classList.remove(cls));
+    };
+    const applyCbClass = (mode) => {
+      clearCbClasses();
+      const cls = MODE_TO_CLASS[mode];
+      if (cls) document.documentElement.classList.add(cls);
+    };
+    const currentCbMode = () => {
+      const rootEl = document.documentElement;
+      for (const [mode, cls] of Object.entries(MODE_TO_CLASS)) { if (rootEl.classList.contains(cls)) return mode; }
+      return 'none';
+    };
+    const setupCbSim = () => {
+      const select = document.getElementById('cb-select');
+      if (!select) return;
+      try { select.value = currentCbMode(); } catch {}
+      select.addEventListener('change', () => applyCbClass(select.value));
+    };
+
+    const setupCountControl = () => {
+      const input = document.getElementById('color-count');
+      const out = document.getElementById('color-count-out');
+      if (!input) return;
+      const clamp = (n, min, max) => Math.max(min, Math.min(max, n));
+      const read = () => clamp(Number(input.value) || 6, 6, 10);
+      const syncOut = () => { if (out) out.textContent = String(read()); };
+      const onChange = () => { syncOut(); render(); };
+      syncOut();
+      input.addEventListener('input', onChange);
+      document.addEventListener('palettes:updated', () => { syncOut(); render(); });
+    };
+
+    let copyDelegationSetup = false;
+    const setupCopyDelegation = () => {
+      if (copyDelegationSetup) return;
+      const root = document.querySelector('.palettes');
+      if (!root) return;
+      const grid = root.querySelector('.palettes__grid');
+      if (!grid) return;
+      grid.addEventListener('click', async (e) => {
+        const target = e.target.closest ? e.target.closest('.copy-btn') : null;
+        if (!target) return;
+        const card = target.closest('.palette-card');
+        if (!card) return;
+        const colors = (card.dataset.colors || '').split(',').filter(Boolean);
+        const json = JSON.stringify(colors, null, 2);
+        try {
+          await navigator.clipboard.writeText(json);
+          const old = target.innerHTML;
+          target.innerHTML = '<svg viewBox="0 0 24 24" aria-hidden="true" focusable="false"><path d="M9 16.2l-3.5-3.5-1.4 1.4L9 19 20.3 7.7l-1.4-1.4z"/></svg>';
+          setTimeout(() => target.innerHTML = old, 900);
+        } catch {
+          window.prompt('Copy palette', json);
+        }
+      });
+      copyDelegationSetup = true;
+    };
+
+    const bootstrap = () => {
+      setupCbSim();
+      setupCountControl();
+      render();
+      setupCopyDelegation();
+      // Re-render when primary color changes
+      document.addEventListener('palettes:updated', render);
+    };
+
+    if (document.readyState === 'loading') document.addEventListener('DOMContentLoaded', bootstrap, { once: true });
+    else bootstrap();
+  })();
+</script>
+
diff --git a/app/src/content/embeds/original_embeds/plotly/banner.py b/app/src/content/embeds/original_embeds/plotly/banner.py
new file mode 100644
index 0000000000000000000000000000000000000000..73841e91b8ae9a0e1d4dcca0e6534b507b0baabe
--- /dev/null
+++ b/app/src/content/embeds/original_embeds/plotly/banner.py
@@ -0,0 +1,134 @@
+import plotly.graph_objects as go
+import numpy as np
+import pandas as pd
+
+# Scene parameters (same ranges as the Astro integration)
+cx, cy = 1.5, 0.5                 # center
+a, b = 1.3, 0.45                  # max extent in x/y (ellipse for anisotropy)
+
+# Spiral galaxy parameters
+num_points = 3000                 # more dots
+num_arms = 3                      # number of spiral arms
+num_turns = 2.1                   # number of turns per arm
+angle_jitter = 0.12               # angular jitter to fan out the arms
+pos_noise = 0.015                 # global position noise
+
+# Generate points along spiral arms (Archimedean spiral)
+t = np.random.rand(num_points) * (2 * np.pi * num_turns)  # progression along the arm
+arm_indices = np.random.randint(0, num_arms, size=num_points)
+arm_offsets = arm_indices * (2 * np.pi / num_arms)
+
+theta = t + arm_offsets + np.random.randn(num_points) * angle_jitter
+
+# Normalized radius (0->center, 1->edge). Power <1 to densify the core
+r_norm = (t / (2 * np.pi * num_turns)) ** 0.9
+
+# Radial/lateral noise that slightly increases with radius
+noise_x = pos_noise * (0.8 + 0.6 * r_norm) * np.random.randn(num_points)
+noise_y = pos_noise * (0.8 + 0.6 * r_norm) * np.random.randn(num_points)
+
+# Elliptic projection
+x_spiral = cx + a * r_norm * np.cos(theta) + noise_x
+y_spiral = cy + b * r_norm * np.sin(theta) + noise_y
+
+# Central bulge (additional points very close to the core)
+bulge_points = int(0.18 * num_points)
+phi_b = 2 * np.pi * np.random.rand(bulge_points)
+r_b = (np.random.rand(bulge_points) ** 2.2) * 0.22  # compact bulge
+noise_x_b = (pos_noise * 0.6) * np.random.randn(bulge_points)
+noise_y_b = (pos_noise * 0.6) * np.random.randn(bulge_points)
+x_bulge = cx + a * r_b * np.cos(phi_b) + noise_x_b
+y_bulge = cy + b * r_b * np.sin(phi_b) + noise_y_b
+
+# Concatenation
+x = np.concatenate([x_spiral, x_bulge])
+y = np.concatenate([y_spiral, y_bulge])
+
+# Central intensity (for sizes/colors). 1 at center, ~0 at edge
+z_spiral = 1 - r_norm
+z_bulge = 1 - (r_b / max(r_b.max(), 1e-6))  # very bright bulge
+z_raw = np.concatenate([z_spiral, z_bulge])
+
+# Sizes: keep the 5..10 scale for consistency
+sizes = (z_raw + 1) * 5
+
+# Remove intermediate filtering: keep all placed points, filter at the very end
+
+df = pd.DataFrame({
+    "x": x,
+    "y": y,
+    "z": sizes,  # reused for size+color as before
+})
+
+def get_label(z):
+    if z < 0.25:
+        return "smol dot"
+    if z < 0.5:
+        return "ok-ish dot"
+    if z < 0.75:
+        return "a dot"
+    else:
+        return "biiig dot"
+
+# Labels based on central intensity
+df["label"] = pd.Series(z_raw).apply(get_label)
+
+# Rendering order: small points first, big ones after (on top)
+df = df.sort_values(by="z", ascending=True).reset_index(drop=True)
+
+fig = go.Figure()
+
+fig.add_trace(go.Scattergl(
+    x=df['x'],
+    y=df['y'],
+    mode='markers',
+    marker=dict(
+        size=df['z'],
+        color=df['z'],
+        colorscale=[
+            [0, 'rgb(78, 165, 183)'],
+            [0.5, 'rgb(206, 192, 250)'],
+            [1, 'rgb(232, 137, 171)']
+        ],
+        opacity=0.9,
+    ),
+    customdata=df[["label"]],
+    hovertemplate="Dot category: %{customdata[0]}",
+    hoverlabel=dict(namelength=0),
+    showlegend=False
+))
+
+fig.update_layout(
+    autosize=True,
+    paper_bgcolor='rgba(0,0,0,0)',
+    plot_bgcolor='rgba(0,0,0,0)',
+    showlegend=False,
+    margin=dict(l=0, r=0, t=0, b=0),
+    xaxis=dict(
+        showgrid=False,
+        zeroline=False,
+        showticklabels=False,
+        range=[0, 3]
+    ),
+    yaxis=dict(
+        showgrid=False,
+        zeroline=False,
+        showticklabels=False,
+        scaleanchor="x",
+        scaleratio=1,
+        range=[0, 1]
+    )
+)
+
+# fig.show()
+
+fig.write_html(
+    "../app/src/content/fragments/banner.html",
+    include_plotlyjs=False,
+    full_html=False,
+    config={
+        'displayModeBar': False,
+        'responsive': True,
+        'scrollZoom': False,
+    }
+)
\ No newline at end of file
diff --git a/app/src/content/embeds/original_embeds/plotly/bar.py b/app/src/content/embeds/original_embeds/plotly/bar.py
new file mode 100644
index 0000000000000000000000000000000000000000..4137fb1a2f90da2f7cf2ad1aec4bc15ca9c5720a
--- /dev/null
+++ b/app/src/content/embeds/original_embeds/plotly/bar.py
@@ -0,0 +1,173 @@
+import plotly.graph_objects as go
+import plotly.io as pio
+import numpy as np
+
+"""
+Stacked bar chart: GPU memory breakdown vs sequence length, with menus for Model Size and Recomputation.
+Responsive, no zoom/pan, clean hover; styled to match the minimal theme.
+"""
+
+# Axes
+seq_labels = ["1024", "2048", "4096", "8192"]
+seq_scale = np.array([1, 2, 4, 8], dtype=float)
+
+# Components and colors (aligned with the provided example)
+components = [
+    ("parameters", "rgb(78, 165, 183)"),
+    ("gradients",  "rgb(227, 138, 66)"),
+    ("optimizer",  "rgb(232, 137, 171)"),
+    ("activations", "rgb(206, 192, 250)"),
+]
+
+# Model sizes and base memory (GB) for params/grad/opt (constant vs seq), by size
+model_sizes = ["1B", "3B", "8B", "70B", "405B"]
+params_mem = {
+    "1B": 4.0,
+    "3B": 13.3,
+    "8B": 26.0,
+    "70B": 244.0,
+    "405B": 1520.0,
+}
+# Optimizer ~= 2x params; gradients ~= params (illustrative)
+
+# Activations base coefficient per size (growth ~ coeff * (seq/1024)^2)
+act_coeff = {
+    "1B": 3.6,
+    "3B": 9.3,
+    "8B": 46.2,
+    "70B": 145.7,
+    "405B": 1519.9,
+}
+
+def activations_curve(size_key: str, recompute: str) -> np.ndarray:
+    base = act_coeff[size_key] * (seq_scale ** 2)
+    if recompute == "selective":
+        return base * 0.25
+    if recompute == "full":
+        return base * (1.0/16.0)
+    return base
+
+def stack_for(size_key: str, recompute: str):
+    p = np.full_like(seq_scale, params_mem[size_key], dtype=float)
+    g = np.full_like(seq_scale, params_mem[size_key], dtype=float)
+    o = np.full_like(seq_scale, 2.0 * params_mem[size_key], dtype=float)
+    a = activations_curve(size_key, recompute)
+    return {
+        "parameters": p,
+        "gradients": g,
+        "optimizer": o,
+        "activations": a,
+    }
+
+# Precompute all combinations
+recomp_modes = ["none", "selective", "full"]
+Y = {mode: {size: stack_for(size, mode) for size in model_sizes} for mode in recomp_modes}
+
+# Build traces: 4 traces per size (20 total). Start with size index 0 visible
+fig = go.Figure()
+for size in model_sizes:
+    for comp_name, color in components:
+        fig.add_bar(
+            x=seq_labels,
+            y=Y["none"][size][comp_name],
+            name=comp_name,
+            marker=dict(color=color),
+            hovertemplate="Seq len=%{x}<br>Mem=%{y:.1f}GB<br>%{data.name}<extra></extra>",
+            showlegend=True,
+            visible=(size == model_sizes[0]),
+        )
+
+# Compute y-axis ranges per size and recomputation
+def max_total(size: str, mode: str) -> float:
+    stacks = Y[mode][size]
+    totals = stacks["parameters"] + stacks["gradients"] + stacks["optimizer"] + stacks["activations"]
+    return float(np.max(totals))
+
+layout_y_ranges = {mode: {size: 1.05 * max_total(size, mode) for size in model_sizes} for mode in recomp_modes}
+
+# Layout
+fig.update_layout(
+    barmode="stack",
+    autosize=True,
+    paper_bgcolor="rgba(0,0,0,0)",
+    plot_bgcolor="rgba(0,0,0,0)",
+    margin=dict(l=40, r=28, t=20, b=40),
+    hovermode="x unified",
+    legend=dict(orientation="h", yanchor="bottom", y=1.02, xanchor="left", x=0),
+    xaxis=dict(title=dict(text="Sequence Length"), fixedrange=True),
+    yaxis=dict(title=dict(text="Memory (GB)"), fixedrange=True),
+)
+
+# Updatemenus: Model Size (toggle visibility)
+buttons_sizes = []
+for i, size in enumerate(model_sizes):
+    visible = [False] * (len(model_sizes) * len(components))
+    start = i * len(components)
+    for j in range(len(components)):
+        visible[start + j] = True
+    buttons_sizes.append(dict(
+        label=size,
+        method="update",
+        args=[
+            {"visible": visible},
+            {"yaxis": {"range": [0, layout_y_ranges["none"][size]]}},
+        ],
+    ))
+
+# Updatemenus: Recomputation (restyle y across all traces)
+def y_for_mode(mode: str):
+    ys = []
+    for size in model_sizes:
+        stacks = Y[mode][size]
+        for comp_name, _ in components:
+            ys.append(stacks[comp_name])
+    return ys
+
+buttons_recomp = []
+for mode, label in [("none", "None"), ("selective", "selective"), ("full", "full")]:
+    ys = y_for_mode(mode)
+    # Flatten into the format expected by Plotly for multiple traces
+    buttons_recomp.append(dict(
+        label=label,
+        method="update",
+        args=[
+            {"y": ys},
+            {"yaxis": {"range": [0, max(layout_y_ranges[mode].values())]}},
+        ],
+    ))
+
+fig.update_layout(
+    updatemenus=[
+        dict(
+            type="dropdown",
+            x=1.03, xanchor="left",
+            y=0.60, yanchor="top",
+            showactive=True,
+            active=0,
+            buttons=buttons_sizes,
+        ),
+        dict(
+            type="dropdown",
+            x=1.03, xanchor="left",
+            y=0.40, yanchor="top",
+            showactive=True,
+            active=0,
+            buttons=buttons_recomp,
+        ),
+    ],
+    annotations=[
+        dict(text="Model Size:", x=1.03, xanchor="left", xref="paper", y=0.60, yanchor="bottom", yref="paper", showarrow=False),
+        dict(text="Recomputation:", x=1.03, xanchor="left", xref="paper", y=0.40, yanchor="bottom", yref="paper", showarrow=False),
+    ],
+)
+
+# Write fragment
+fig.write_html("../../app/src/content/fragments/bar.html",
+               include_plotlyjs=False,
+               full_html=False,
+               config={
+                   'displayModeBar': False,
+                   'responsive': True,
+                   'scrollZoom': False,
+               })
+
diff --git a/app/src/content/embeds/original_embeds/plotly/heatmap.py b/app/src/content/embeds/original_embeds/plotly/heatmap.py
new file mode 100644
index 0000000000000000000000000000000000000000..3ca90d9eb42502e593dad2545993e6195e9d1cff
--- /dev/null
+++ b/app/src/content/embeds/original_embeds/plotly/heatmap.py
@@ -0,0 +1,125 @@
+import plotly.graph_objects as go
+import plotly.io as pio
+import numpy as np
+import datetime as dt
+import os
+
+"""
+Calendar-like heatmap (GitHub-style) over the last 52 weeks.
+Minimal, responsive, transparent background; suitable for Distill.
+"""
+
+# Parameters
+NUM_WEEKS = 52
+DAYS = ["Mon", "Tue", "Wed", "Thu", "Fri", "Sat", "Sun"]
+
+# Build dates matrix (7 rows x NUM_WEEKS columns)
+today = dt.date.today()
+# Align to start of current week (Monday)
+start = today - dt.timedelta(days=(today.weekday()))  # Monday of current week
+weeks = [start - dt.timedelta(weeks=w) for w in range(NUM_WEEKS-1, -1, -1)]
+dates = [[weeks[c] + dt.timedelta(days=r) for c in range(NUM_WEEKS)] for r in range(7)]
+
+# Generate values (synthetic) — smooth seasonal pattern + noise
+def gen_value(d: dt.date) -> float:
+    day_of_year = d.timetuple().tm_yday
+    base = 0.5 + 0.45 * np.sin(2 * np.pi * (day_of_year / 365.0))
+    noise = np.random.default_rng(hash(d) % 2**32).uniform(-0.15, 0.15)
+    return max(0.0, min(1.0, base + noise))
+
+z = [[gen_value(d) for d in row] for row in dates]
+custom = [[d.isoformat() for d in row] for row in dates]
+
+# Colors aligned with other charts (slate / blue / gray)
+colorscale = [
+    [0.00, "#e5e7eb"],   # light gray background for low
+    [0.40, "#64748b"],   # slate-500
+    [0.75, "#2563eb"],   # blue-600
+    [1.00, "#4b5563"],   # gray-600 (high end accent)
+]
+
+fig = go.Figure(
+    data=go.Heatmap(
+        z=z,
+        x=[w.isoformat() for w in weeks],
+        y=DAYS,
+        colorscale=colorscale,
+        showscale=False,
+        hovertemplate="Date: %{customdata}<br>Value: %{z:.2f}<extra></extra>",
+        customdata=custom,
+        xgap=2,
+        ygap=2,
+    )
+)
+
+fig.update_layout(
+    autosize=True,
+    paper_bgcolor="rgba(0,0,0,0)",
+    plot_bgcolor="rgba(0,0,0,0)",
+    margin=dict(l=28, r=12, t=8, b=28),
+    xaxis=dict(
+        showgrid=False,
+        zeroline=False,
+        showline=False,
+        ticks="",
+        showticklabels=False,
+        fixedrange=True,
+    ),
+    yaxis=dict(
+        showgrid=False,
+        zeroline=False,
+        showline=False,
+        ticks="",
+        tickfont=dict(size=12, color="rgba(0,0,0,0.65)"),
+        fixedrange=True,
+    ),
+)
+
+post_script = """
+(function(){
+  var plots = document.querySelectorAll('.js-plotly-plot');
+  plots.forEach(function(gd){
+    function round(){
+      try {
+        var root = gd && gd.parentNode ? gd.parentNode : document;
+        var rects = root.querySelectorAll('.hoverlayer .hovertext rect');
+        rects.forEach(function(r){ r.setAttribute('rx', 8); r.setAttribute('ry', 8); });
+      } catch(e) {}
+    }
+    if (gd && gd.on){
+      gd.on('plotly_hover', round);
+      gd.on('plotly_unhover', round);
+      gd.on('plotly_relayout', round);
+    }
+    setTimeout(round, 0);
+  });
+})();
+"""
+
+html = pio.to_html(
+    fig,
+    include_plotlyjs=False,
+    full_html=False,
+    post_script=post_script,
+    config={
+        "displayModeBar": False,
+        "responsive": True,
+        "scrollZoom": False,
+        "doubleClick": False,
+        "modeBarButtonsToRemove": [
+            "zoom2d", "pan2d", "select2d", "lasso2d",
+            "zoomIn2d", "zoomOut2d", "autoScale2d", "resetScale2d",
+            "toggleSpikelines"
+        ],
+    },
+)
+
+fig.write_html("../app/src/content/fragments/heatmap.html", 
+               include_plotlyjs=False, 
+               full_html=False, 
+               config={
+                   'displayModeBar': False,
+                   'responsive': True, 
+                   'scrollZoom': False,
+               })
+
diff --git a/app/src/content/embeds/original_embeds/plotly/line.py b/app/src/content/embeds/original_embeds/plotly/line.py
new file mode 100644
index 0000000000000000000000000000000000000000..1fc71f26a0f3385b8c5455c6668abb2d26333e0f
--- /dev/null
+++ b/app/src/content/embeds/original_embeds/plotly/line.py
@@ -0,0 +1,276 @@
+import plotly.graph_objects as go
+import plotly.io as pio
+import numpy as np
+import os
+import uuid
+
+"""
+Interactive line chart example (Baseline / Improved / Target) with a live slider.
+
+Context: research-style training curves for multiple datasets (CIFAR-10, CIFAR-100, ImageNet-1K).
+The slider "Augmentation α" blends the Improved curve between the Baseline (α=0)
+and an augmented counterpart (α=1) via a simple mixing equation.
+Export remains responsive, with no zoom and no mode bar.
+"""
+
+# Grid (x) and parameterization
+N = 240
+x = np.linspace(0, 1, N)
+
+# Logistic helper for smooth learning curves
+def logistic(xv: np.ndarray, ymin: float, ymax: float, k: float, x0: float) -> np.ndarray:
+    return ymin + (ymax - ymin) / (1.0 + np.exp(-k * (xv - x0)))
+
+# Plausible dataset params (baseline vs augmented) + a constant target line
+datasets_params = [
+    {
+        "name": "CIFAR-10",
+        "base": {"ymin": 0.10, "ymax": 0.90, "k": 10.0, "x0": 0.55},
+        "aug":  {"ymin": 0.15, "ymax": 0.96, "k": 12.0, "x0": 0.40},
+        "target": 0.97,
+    },
+    {
+        "name": "CIFAR-100",
+        "base": {"ymin": 0.05, "ymax": 0.70, "k": 9.5, "x0": 0.60},
+        "aug":  {"ymin": 0.08, "ymax": 0.80, "k": 11.0, "x0": 0.45},
+        "target": 0.85,
+    },
+    {
+        "name": "ImageNet-1K",
+        "base": {"ymin": 0.02, "ymax": 0.68, "k": 8.5, "x0": 0.65},
+        "aug":  {"ymin": 0.04, "ymax": 0.75, "k": 9.5, "x0": 0.50},
+        "target": 0.82,
+    },
+]
+
+# Initial dataset index and alpha
+alpha0 = 0.7
+ds0 = datasets_params[0]
+base0 = logistic(x, **ds0["base"])
+aug0 = logistic(x, **ds0["aug"])
+target0 = np.full_like(x, ds0["target"], dtype=float)
+
+# Traces: Baseline (fixed), Improved (blended by α), Target (constant goal)
+blend = lambda l, e, a: (1 - a) * l + a * e
+y1 = base0
+y2 = blend(base0, aug0, alpha0)
+y3 = target0
+
+color_base = "#64748b"     # slate-500
+color_improved = "#F981D4" # pink
+color_target = "#4b5563"   # gray-600 (dash)
+
+fig = go.Figure()
+fig.add_trace(
+    go.Scatter(
+        x=x,
+        y=y1,
+        name="Baseline",
+        mode="lines",
+        line=dict(color=color_base, width=2, shape="spline", smoothing=0.6),
+        hovertemplate="<b>%{fullData.name}</b><br>x=%{x:.2f}<br>y=%{y:.3f}<extra></extra>",
+        showlegend=True,
+    )
+)
+fig.add_trace(
+    go.Scatter(
+        x=x,
+        y=y2,
+        name="Improved",
+        mode="lines",
+        line=dict(color=color_improved, width=2, shape="spline", smoothing=0.6),
+        hovertemplate="<b>%{fullData.name}</b><br>x=%{x:.2f}<br>y=%{y:.3f}<extra></extra>",
+        showlegend=True,
+    )
+)
+fig.add_trace(
+    go.Scatter(
+        x=x,
+        y=y3,
+        name="Target",
+        mode="lines",
+        line=dict(color=color_target, width=2, dash="dash"),
+        hovertemplate="<b>%{fullData.name}</b><br>x=%{x:.2f}<br>y=%{y:.3f}<extra></extra>",
+        showlegend=True,
+    )
+)
+
+fig.update_layout(
+    autosize=True,
+    paper_bgcolor="rgba(0,0,0,0)",
+    plot_bgcolor="rgba(0,0,0,0)",
+    margin=dict(l=40, r=28, t=20, b=40),
+    hovermode="x unified",
+    legend=dict(
+        orientation="v",
+        x=1,
+        y=0,
+        xanchor="right",
+        yanchor="bottom",
+        bgcolor="rgba(255,255,255,0)",
+        borderwidth=0,
+    ),
+    hoverlabel=dict(
+        bgcolor="white",
+        font=dict(color="#111827", size=12),
+        bordercolor="rgba(0,0,0,0.15)",
+        align="left",
+        namelength=-1,
+    ),
+    xaxis=dict(
+        showgrid=False,
+        zeroline=False,
+        showline=True,
+        linecolor="rgba(0,0,0,0.25)",
+        linewidth=1,
+        ticks="outside",
+        ticklen=6,
+        tickcolor="rgba(0,0,0,0.25)",
+        tickfont=dict(size=12, color="rgba(0,0,0,0.55)"),
+        title=None,
+        automargin=True,
+        fixedrange=True,
+    ),
+    yaxis=dict(
+        showgrid=False,
+        zeroline=False,
+        showline=True,
+        linecolor="rgba(0,0,0,0.25)",
+        linewidth=1,
+        ticks="outside",
+        ticklen=6,
+        tickcolor="rgba(0,0,0,0.25)",
+        tickfont=dict(size=12, color="rgba(0,0,0,0.55)"),
+        title=None,
+        tickformat=".2f",
+        rangemode="tozero",
+        automargin=True,
+        fixedrange=True,
+    ),
+)
+
+# Write the fragment next to this file into src/fragments/line.html (robust path)
+output_path = os.path.join(os.path.dirname(__file__), "fragments", "line.html")
+os.makedirs(os.path.dirname(output_path), exist_ok=True)
+
+# Inject a small post-render script to round the hover box corners
+post_script = """
+(function(){
+  function attach(gd){
+    function round(){
+      try {
+        var root = gd && gd.parentNode ? gd.parentNode : document;
+        var rects = root.querySelectorAll('.hoverlayer .hovertext rect');
+        rects.forEach(function(r){ r.setAttribute('rx', 8); r.setAttribute('ry', 8); });
+      } catch(e) {}
+    }
+    if (gd && gd.on) {
+      gd.on('plotly_hover', round);
+      gd.on('plotly_unhover', round);
+      gd.on('plotly_relayout', round);
+    }
+    setTimeout(round, 0);
+  }
+  var plots = document.querySelectorAll('.js-plotly-plot');
+  plots.forEach(attach);
+})();
+"""
+
+html_plot = pio.to_html(
+    fig,
+    include_plotlyjs=False,
+    full_html=False,
+    post_script=post_script,
+    config={
+        "displayModeBar": False,
+        "responsive": True,
+        "scrollZoom": False,
+        "doubleClick": False,
+        "modeBarButtonsToRemove": [
+            "zoom2d", "pan2d", "select2d", "lasso2d",
+            "zoomIn2d", "zoomOut2d", "autoScale2d", "resetScale2d",
+            "toggleSpikelines"
+        ],
+    },
+)
+
+# Build a self-contained fragment with a live slider (no mouseup required)
+uid = uuid.uuid4().hex[:8]
+slider_id = f"line-ex-alpha-{uid}"
+container_id = f"line-ex-container-{uid}"
+
+slider_tpl = '''
+<div id="__CID__">
+  __PLOT__
+  <div class="plotly_controls" style="margin-top:12px; display:flex; gap:16px; align-items:center;">
+    <label style="font-size:12px;color:rgba(0,0,0,.65); display:flex; align-items:center; gap:6px; white-space:nowrap; padding:6px 10px;">
+      Dataset
+      <select id="__DSID__" style="font-size:12px; padding:2px 6px;">
+        <option value="0">CIFAR-10</option>
+        <option value="1">CIFAR-100</option>
+        <option value="2">ImageNet-1K</option>
+      </select>
+    </label>
+    <label style="font-size:12px;color:rgba(0,0,0,.65);display:flex;align-items:center;gap:10px; flex:1; padding:6px 10px;">
+      Augmentation α
+      <input id="__SID__" type="range" min="0" max="1" step="0.01" value="__A0__" style="flex:1;">
+      <span class="alpha-value">__A0__</span>
+    </label>
+  </div>
+</div>
+<script>
+(function(){
+  var container = document.getElementById('__CID__');
+  if(!container) return;
+  var gd = container.querySelector('.js-plotly-plot');
+  var slider = document.getElementById('__SID__');
+  var dsSelect = document.getElementById('__DSID__');
+  var valueEl = container.querySelector('.alpha-value');
+  var N = __N__;
+  var xs = Array.from({length: N}, function(_,i){ return i/(N-1); });
+  function logistic(x, ymin, ymax, k, x0){ return ymin + (ymax - ymin) / (1 + Math.exp(-k*(x - x0))); }
+  function blend(l,e,a){ return (1-a)*l + a*e; }
+  var datasets = [
+    { name:'CIFAR-10',  base:{ymin:0.10,ymax:0.90,k:10.0,x0:0.55}, aug:{ymin:0.15,ymax:0.96,k:12.0,x0:0.40}, target:0.97 },
+    { name:'CIFAR-100', base:{ymin:0.05,ymax:0.70,k:9.5,x0:0.60},  aug:{ymin:0.08,ymax:0.80,k:11.0,x0:0.45},  target:0.85 },
+    { name:'ImageNet-1K', base:{ymin:0.02,ymax:0.68,k:8.5,x0:0.65}, aug:{ymin:0.04,ymax:0.75,k:9.5,x0:0.50},  target:0.82 }
+  ];
+  var dsi = 0;
+  var yb = xs.map(function(x){ return logistic(x, datasets[dsi].base.ymin, datasets[dsi].base.ymax, datasets[dsi].base.k, datasets[dsi].base.x0); });
+  var ya = xs.map(function(x){ return logistic(x, datasets[dsi].aug.ymin, datasets[dsi].aug.ymax, datasets[dsi].aug.k, datasets[dsi].aug.x0); });
+  var yt = xs.map(function(){ return datasets[dsi].target; });
+  function applyAlpha(a){
+    var yi = yb.map(function(v,i){ return blend(v, ya[i], a); });
+    Plotly.restyle(gd, {y:[yi]}, [1]); // only Improved changes with α
+    if(valueEl) valueEl.textContent = a.toFixed(2);
+  }
+  function applyDataset(){
+    var d = datasets[dsi];
+    yb = xs.map(function(x){ return logistic(x, d.base.ymin, d.base.ymax, d.base.k, d.base.x0); });
+    ya = xs.map(function(x){ return logistic(x, d.aug.ymin, d.aug.ymax, d.aug.k, d.aug.x0); });
+    yt = xs.map(function(){ return d.target; });
+    var a = parseFloat(slider.value)||0;
+    var yi = yb.map(function(v,i){ return blend(v, ya[i], a); });
+    Plotly.restyle(gd, {y:[yb]}, [0]); // Baseline
+    Plotly.restyle(gd, {y:[yi]}, [1]); // Improved (blended)
+    Plotly.restyle(gd, {y:[yt]}, [2]); // Target
+  }
+  var initA = parseFloat(slider.value)||0;
+  slider.addEventListener('input', function(e){ applyAlpha(parseFloat(e.target.value)||0); });
+  dsSelect.addEventListener('change', function(e){ dsi = parseInt(e.target.value)||0; applyDataset(); });
+  setTimeout(function(){ applyDataset(); applyAlpha(initA); }, 0);
+})();
+</script>
+'''
+
+slider_html = (slider_tpl
+    .replace('__CID__', container_id)
+    .replace('__SID__', slider_id)
+    .replace('__A0__', f"{alpha0:.2f}")
+    .replace('__N__', str(N))
+    .replace('__PLOT__', html_plot)
+)
+
+with open("../../app/src/content/fragments/line.html", "w", encoding="utf-8") as f:
+    f.write(slider_html)
+
diff --git a/app/src/content/embeds/original_embeds/plotly/poetry.lock b/app/src/content/embeds/original_embeds/plotly/poetry.lock
new file mode 100644
index 0000000000000000000000000000000000000000..55dc5b270a044b51d1def9be28f25d940a66265f
--- /dev/null
+++ b/app/src/content/embeds/original_embeds/plotly/poetry.lock
@@ -0,0 +1,511 @@
+# This file is automatically @generated by Poetry 2.1.3 and should not be changed by hand.
+
+[[package]]
+name = "certifi"
+version = "2025.8.3"
+description = "Python package for providing Mozilla's CA Bundle."
+optional = false
+python-versions = ">=3.7"
+groups = ["main"]
+files = [
+    {file = "certifi-2025.8.3-py3-none-any.whl", hash = "sha256:f6c12493cfb1b06ba2ff328595af9350c65d6644968e5d3a2ffd78699af217a5"},
+    {file = "certifi-2025.8.3.tar.gz", hash = "sha256:e564105f78ded564e3ae7c923924435e1daa7463faeab5bb932bc53ffae63407"},
+]
+
+[[package]]
+name = "charset-normalizer"
+version = "3.4.3"
+description = "The Real First Universal Charset Detector. Open, modern and actively maintained alternative to Chardet."
+optional = false
+python-versions = ">=3.7"
+groups = ["main"]
+files = [
+    {file = "charset_normalizer-3.4.3-cp310-cp310-macosx_10_9_universal2.whl", hash = "sha256:fb7f67a1bfa6e40b438170ebdc8158b78dc465a5a67b6dde178a46987b244a72"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:cc9370a2da1ac13f0153780040f465839e6cccb4a1e44810124b4e22483c93fe"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:07a0eae9e2787b586e129fdcbe1af6997f8d0e5abaa0bc98c0e20e124d67e601"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:74d77e25adda8581ffc1c720f1c81ca082921329452eba58b16233ab1842141c"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:d0e909868420b7049dafd3a31d45125b31143eec59235311fc4c57ea26a4acd2"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-musllinux_1_2_aarch64.whl", hash = "sha256:c6f162aabe9a91a309510d74eeb6507fab5fff92337a15acbe77753d88d9dcf0"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-musllinux_1_2_ppc64le.whl", hash = "sha256:4ca4c094de7771a98d7fbd67d9e5dbf1eb73efa4f744a730437d8a3a5cf994f0"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-musllinux_1_2_s390x.whl", hash = "sha256:02425242e96bcf29a49711b0ca9f37e451da7c70562bc10e8ed992a5a7a25cc0"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-musllinux_1_2_x86_64.whl", hash = "sha256:78deba4d8f9590fe4dae384aeff04082510a709957e968753ff3c48399f6f92a"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-win32.whl", hash = "sha256:d79c198e27580c8e958906f803e63cddb77653731be08851c7df0b1a14a8fc0f"},
+    {file = "charset_normalizer-3.4.3-cp310-cp310-win_amd64.whl", hash = "sha256:c6e490913a46fa054e03699c70019ab869e990270597018cef1d8562132c2669"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:b256ee2e749283ef3ddcff51a675ff43798d92d746d1a6e4631bf8c707d22d0b"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:13faeacfe61784e2559e690fc53fa4c5ae97c6fcedb8eb6fb8d0a15b475d2c64"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:00237675befef519d9af72169d8604a067d92755e84fe76492fef5441db05b91"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:585f3b2a80fbd26b048a0be90c5aae8f06605d3c92615911c3a2b03a8a3b796f"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:0e78314bdc32fa80696f72fa16dc61168fda4d6a0c014e0380f9d02f0e5d8a07"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:96b2b3d1a83ad55310de8c7b4a2d04d9277d5591f40761274856635acc5fcb30"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-musllinux_1_2_ppc64le.whl", hash = "sha256:939578d9d8fd4299220161fdd76e86c6a251987476f5243e8864a7844476ba14"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-musllinux_1_2_s390x.whl", hash = "sha256:fd10de089bcdcd1be95a2f73dbe6254798ec1bda9f450d5828c96f93e2536b9c"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:1e8ac75d72fa3775e0b7cb7e4629cec13b7514d928d15ef8ea06bca03ef01cae"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-win32.whl", hash = "sha256:6cf8fd4c04756b6b60146d98cd8a77d0cdae0e1ca20329da2ac85eed779b6849"},
+    {file = "charset_normalizer-3.4.3-cp311-cp311-win_amd64.whl", hash = "sha256:31a9a6f775f9bcd865d88ee350f0ffb0e25936a7f930ca98995c05abf1faf21c"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:e28e334d3ff134e88989d90ba04b47d84382a828c061d0d1027b1b12a62b39b1"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:0cacf8f7297b0c4fcb74227692ca46b4a5852f8f4f24b3c766dd94a1075c4884"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:c6fd51128a41297f5409deab284fecbe5305ebd7e5a1f959bee1c054622b7018"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:3cfb2aad70f2c6debfbcb717f23b7eb55febc0bb23dcffc0f076009da10c6392"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:1606f4a55c0fd363d754049cdf400175ee96c992b1f8018b993941f221221c5f"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:027b776c26d38b7f15b26a5da1044f376455fb3766df8fc38563b4efbc515154"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:42e5088973e56e31e4fa58eb6bd709e42fc03799c11c42929592889a2e54c491"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:cc34f233c9e71701040d772aa7490318673aa7164a0efe3172b2981218c26d93"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:320e8e66157cc4e247d9ddca8e21f427efc7a04bbd0ac8a9faf56583fa543f9f"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-win32.whl", hash = "sha256:fb6fecfd65564f208cbf0fba07f107fb661bcd1a7c389edbced3f7a493f70e37"},
+    {file = "charset_normalizer-3.4.3-cp312-cp312-win_amd64.whl", hash = "sha256:86df271bf921c2ee3818f0522e9a5b8092ca2ad8b065ece5d7d9d0e9f4849bcc"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:14c2a87c65b351109f6abfc424cab3927b3bdece6f706e4d12faaf3d52ee5efe"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:41d1fc408ff5fdfb910200ec0e74abc40387bccb3252f3f27c0676731df2b2c8"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:1bb60174149316da1c35fa5233681f7c0f9f514509b8e399ab70fea5f17e45c9"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:30d006f98569de3459c2fc1f2acde170b7b2bd265dc1943e87e1a4efe1b67c31"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:416175faf02e4b0810f1f38bcb54682878a4af94059a1cd63b8747244420801f"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:6aab0f181c486f973bc7262a97f5aca3ee7e1437011ef0c2ec04b5a11d16c927"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:fdabf8315679312cfa71302f9bd509ded4f2f263fb5b765cf1433b39106c3cc9"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-musllinux_1_2_s390x.whl", hash = "sha256:bd28b817ea8c70215401f657edef3a8aa83c29d447fb0b622c35403780ba11d5"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:18343b2d246dc6761a249ba1fb13f9ee9a2bcd95decc767319506056ea4ad4dc"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-win32.whl", hash = "sha256:6fb70de56f1859a3f71261cbe41005f56a7842cc348d3aeb26237560bfa5e0ce"},
+    {file = "charset_normalizer-3.4.3-cp313-cp313-win_amd64.whl", hash = "sha256:cf1ebb7d78e1ad8ec2a8c4732c7be2e736f6e5123a4146c5b89c9d1f585f8cef"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-macosx_10_13_universal2.whl", hash = "sha256:3cd35b7e8aedeb9e34c41385fda4f73ba609e561faedfae0a9e75e44ac558a15"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:b89bc04de1d83006373429975f8ef9e7932534b8cc9ca582e4db7d20d91816db"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:2001a39612b241dae17b4687898843f254f8748b796a2e16f1051a17078d991d"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:8dcfc373f888e4fb39a7bc57e93e3b845e7f462dacc008d9749568b1c4ece096"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:18b97b8404387b96cdbd30ad660f6407799126d26a39ca65729162fd810a99aa"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:ccf600859c183d70eb47e05a44cd80a4ce77394d1ac0f79dbd2dd90a69a3a049"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-musllinux_1_2_ppc64le.whl", hash = "sha256:53cd68b185d98dde4ad8990e56a58dea83a4162161b1ea9272e5c9182ce415e0"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-musllinux_1_2_s390x.whl", hash = "sha256:30a96e1e1f865f78b030d65241c1ee850cdf422d869e9028e2fc1d5e4db73b92"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:d716a916938e03231e86e43782ca7878fb602a125a91e7acb8b5112e2e96ac16"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-win32.whl", hash = "sha256:c6dbd0ccdda3a2ba7c2ecd9d77b37f3b5831687d8dc1b6ca5f56a4880cc7b7ce"},
+    {file = "charset_normalizer-3.4.3-cp314-cp314-win_amd64.whl", hash = "sha256:73dc19b562516fc9bcf6e5d6e596df0b4eb98d87e4f79f3ae71840e6ed21361c"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-macosx_10_9_universal2.whl", hash = "sha256:0f2be7e0cf7754b9a30eb01f4295cc3d4358a479843b31f328afd210e2c7598c"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:c60e092517a73c632ec38e290eba714e9627abe9d301c8c8a12ec32c314a2a4b"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:252098c8c7a873e17dd696ed98bbe91dbacd571da4b87df3736768efa7a792e4"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:3653fad4fe3ed447a596ae8638b437f827234f01a8cd801842e43f3d0a6b281b"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:8999f965f922ae054125286faf9f11bc6932184b93011d138925a1773830bbe9"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-musllinux_1_2_aarch64.whl", hash = "sha256:d95bfb53c211b57198bb91c46dd5a2d8018b3af446583aab40074bf7988401cb"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-musllinux_1_2_ppc64le.whl", hash = "sha256:5b413b0b1bfd94dbf4023ad6945889f374cd24e3f62de58d6bb102c4d9ae534a"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-musllinux_1_2_s390x.whl", hash = "sha256:b5e3b2d152e74e100a9e9573837aba24aab611d39428ded46f4e4022ea7d1942"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-musllinux_1_2_x86_64.whl", hash = "sha256:a2d08ac246bb48479170408d6c19f6385fa743e7157d716e144cad849b2dd94b"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-win32.whl", hash = "sha256:ec557499516fc90fd374bf2e32349a2887a876fbf162c160e3c01b6849eaf557"},
+    {file = "charset_normalizer-3.4.3-cp38-cp38-win_amd64.whl", hash = "sha256:5d8d01eac18c423815ed4f4a2ec3b439d654e55ee4ad610e153cf02faf67ea40"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-macosx_10_9_universal2.whl", hash = "sha256:70bfc5f2c318afece2f5838ea5e4c3febada0be750fcf4775641052bbba14d05"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:23b6b24d74478dc833444cbd927c338349d6ae852ba53a0d02a2de1fce45b96e"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:34a7f768e3f985abdb42841e20e17b330ad3aaf4bb7e7aeeb73db2e70f077b99"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:fb731e5deb0c7ef82d698b0f4c5bb724633ee2a489401594c5c88b02e6cb15f7"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:257f26fed7d7ff59921b78244f3cd93ed2af1800ff048c33f624c87475819dd7"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-musllinux_1_2_aarch64.whl", hash = "sha256:1ef99f0456d3d46a50945c98de1774da86f8e992ab5c77865ea8b8195341fc19"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-musllinux_1_2_ppc64le.whl", hash = "sha256:2c322db9c8c89009a990ef07c3bcc9f011a3269bc06782f916cd3d9eed7c9312"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-musllinux_1_2_s390x.whl", hash = "sha256:511729f456829ef86ac41ca78c63a5cb55240ed23b4b737faca0eb1abb1c41bc"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-musllinux_1_2_x86_64.whl", hash = "sha256:88ab34806dea0671532d3f82d82b85e8fc23d7b2dd12fa837978dad9bb392a34"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-win32.whl", hash = "sha256:16a8770207946ac75703458e2c743631c79c59c5890c80011d536248f8eaa432"},
+    {file = "charset_normalizer-3.4.3-cp39-cp39-win_amd64.whl", hash = "sha256:d22dbedd33326a4a5190dd4fe9e9e693ef12160c77382d9e87919bce54f3d4ca"},
+    {file = "charset_normalizer-3.4.3-py3-none-any.whl", hash = "sha256:ce571ab16d890d23b5c278547ba694193a45011ff86a9162a71307ed9f86759a"},
+    {file = "charset_normalizer-3.4.3.tar.gz", hash = "sha256:6fce4b8500244f6fcb71465d4a4930d132ba9ab8e71a7859e6a5d59851068d14"},
+]
+
+[[package]]
+name = "idna"
+version = "3.10"
+description = "Internationalized Domain Names in Applications (IDNA)"
+optional = false
+python-versions = ">=3.6"
+groups = ["main"]
+files = [
+    {file = "idna-3.10-py3-none-any.whl", hash = "sha256:946d195a0d259cbba61165e88e65941f16e9b36ea6ddb97f00452bae8b1287d3"},
+    {file = "idna-3.10.tar.gz", hash = "sha256:12f65c9b470abda6dc35cf8e63cc574b1c52b11df2c86030af0ac09b01b13ea9"},
+]
+
+[package.extras]
+all = ["flake8 (>=7.1.1)", "mypy (>=1.11.2)", "pytest (>=8.3.2)", "ruff (>=0.6.2)"]
+
+[[package]]
+name = "markdown"
+version = "3.8.2"
+description = "Python implementation of John Gruber's Markdown."
+optional = false
+python-versions = ">=3.9"
+groups = ["main"]
+files = [
+    {file = "markdown-3.8.2-py3-none-any.whl", hash = "sha256:5c83764dbd4e00bdd94d85a19b8d55ccca20fe35b2e678a1422b380324dd5f24"},
+    {file = "markdown-3.8.2.tar.gz", hash = "sha256:247b9a70dd12e27f67431ce62523e675b866d254f900c4fe75ce3dda62237c45"},
+]
+
+[package.extras]
+docs = ["mdx_gh_links (>=0.2)", "mkdocs (>=1.6)", "mkdocs-gen-files", "mkdocs-literate-nav", "mkdocs-nature (>=0.6)", "mkdocs-section-index", "mkdocstrings[python]"]
+testing = ["coverage", "pyyaml"]
+
+[[package]]
+name = "numpy"
+version = "2.2.6"
+description = "Fundamental package for array computing in Python"
+optional = false
+python-versions = ">=3.10"
+groups = ["main"]
+markers = "python_version == \"3.10\""
+files = [
+    {file = "numpy-2.2.6-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:b412caa66f72040e6d268491a59f2c43bf03eb6c96dd8f0307829feb7fa2b6fb"},
+    {file = "numpy-2.2.6-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:8e41fd67c52b86603a91c1a505ebaef50b3314de0213461c7a6e99c9a3beff90"},
+    {file = "numpy-2.2.6-cp310-cp310-macosx_14_0_arm64.whl", hash = "sha256:37e990a01ae6ec7fe7fa1c26c55ecb672dd98b19c3d0e1d1f326fa13cb38d163"},
+    {file = "numpy-2.2.6-cp310-cp310-macosx_14_0_x86_64.whl", hash = "sha256:5a6429d4be8ca66d889b7cf70f536a397dc45ba6faeb5f8c5427935d9592e9cf"},
+    {file = "numpy-2.2.6-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:efd28d4e9cd7d7a8d39074a4d44c63eda73401580c5c76acda2ce969e0a38e83"},
+    {file = "numpy-2.2.6-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:fc7b73d02efb0e18c000e9ad8b83480dfcd5dfd11065997ed4c6747470ae8915"},
+    {file = "numpy-2.2.6-cp310-cp310-musllinux_1_2_aarch64.whl", hash = "sha256:74d4531beb257d2c3f4b261bfb0fc09e0f9ebb8842d82a7b4209415896adc680"},
+    {file = "numpy-2.2.6-cp310-cp310-musllinux_1_2_x86_64.whl", hash = "sha256:8fc377d995680230e83241d8a96def29f204b5782f371c532579b4f20607a289"},
+    {file = "numpy-2.2.6-cp310-cp310-win32.whl", hash = "sha256:b093dd74e50a8cba3e873868d9e93a85b78e0daf2e98c6797566ad8044e8363d"},
+    {file = "numpy-2.2.6-cp310-cp310-win_amd64.whl", hash = "sha256:f0fd6321b839904e15c46e0d257fdd101dd7f530fe03fd6359c1ea63738703f3"},
+    {file = "numpy-2.2.6-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:f9f1adb22318e121c5c69a09142811a201ef17ab257a1e66ca3025065b7f53ae"},
+    {file = "numpy-2.2.6-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:c820a93b0255bc360f53eca31a0e676fd1101f673dda8da93454a12e23fc5f7a"},
+    {file = "numpy-2.2.6-cp311-cp311-macosx_14_0_arm64.whl", hash = "sha256:3d70692235e759f260c3d837193090014aebdf026dfd167834bcba43e30c2a42"},
+    {file = "numpy-2.2.6-cp311-cp311-macosx_14_0_x86_64.whl", hash = "sha256:481b49095335f8eed42e39e8041327c05b0f6f4780488f61286ed3c01368d491"},
+    {file = "numpy-2.2.6-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:b64d8d4d17135e00c8e346e0a738deb17e754230d7e0810ac5012750bbd85a5a"},
+    {file = "numpy-2.2.6-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:ba10f8411898fc418a521833e014a77d3ca01c15b0c6cdcce6a0d2897e6dbbdf"},
+    {file = "numpy-2.2.6-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:bd48227a919f1bafbdda0583705e547892342c26fb127219d60a5c36882609d1"},
+    {file = "numpy-2.2.6-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:9551a499bf125c1d4f9e250377c1ee2eddd02e01eac6644c080162c0c51778ab"},
+    {file = "numpy-2.2.6-cp311-cp311-win32.whl", hash = "sha256:0678000bb9ac1475cd454c6b8c799206af8107e310843532b04d49649c717a47"},
+    {file = "numpy-2.2.6-cp311-cp311-win_amd64.whl", hash = "sha256:e8213002e427c69c45a52bbd94163084025f533a55a59d6f9c5b820774ef3303"},
+    {file = "numpy-2.2.6-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:41c5a21f4a04fa86436124d388f6ed60a9343a6f767fced1a8a71c3fbca038ff"},
+    {file = "numpy-2.2.6-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:de749064336d37e340f640b05f24e9e3dd678c57318c7289d222a8a2f543e90c"},
+    {file = "numpy-2.2.6-cp312-cp312-macosx_14_0_arm64.whl", hash = "sha256:894b3a42502226a1cac872f840030665f33326fc3dac8e57c607905773cdcde3"},
+    {file = "numpy-2.2.6-cp312-cp312-macosx_14_0_x86_64.whl", hash = "sha256:71594f7c51a18e728451bb50cc60a3ce4e6538822731b2933209a1f3614e9282"},
+    {file = "numpy-2.2.6-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f2618db89be1b4e05f7a1a847a9c1c0abd63e63a1607d892dd54668dd92faf87"},
+    {file = "numpy-2.2.6-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:fd83c01228a688733f1ded5201c678f0c53ecc1006ffbc404db9f7a899ac6249"},
+    {file = "numpy-2.2.6-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:37c0ca431f82cd5fa716eca9506aefcabc247fb27ba69c5062a6d3ade8cf8f49"},
+    {file = "numpy-2.2.6-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:fe27749d33bb772c80dcd84ae7e8df2adc920ae8297400dabec45f0dedb3f6de"},
+    {file = "numpy-2.2.6-cp312-cp312-win32.whl", hash = "sha256:4eeaae00d789f66c7a25ac5f34b71a7035bb474e679f410e5e1a94deb24cf2d4"},
+    {file = "numpy-2.2.6-cp312-cp312-win_amd64.whl", hash = "sha256:c1f9540be57940698ed329904db803cf7a402f3fc200bfe599334c9bd84a40b2"},
+    {file = "numpy-2.2.6-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:0811bb762109d9708cca4d0b13c4f67146e3c3b7cf8d34018c722adb2d957c84"},
+    {file = "numpy-2.2.6-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:287cc3162b6f01463ccd86be154f284d0893d2b3ed7292439ea97eafa8170e0b"},
+    {file = "numpy-2.2.6-cp313-cp313-macosx_14_0_arm64.whl", hash = "sha256:f1372f041402e37e5e633e586f62aa53de2eac8d98cbfb822806ce4bbefcb74d"},
+    {file = "numpy-2.2.6-cp313-cp313-macosx_14_0_x86_64.whl", hash = "sha256:55a4d33fa519660d69614a9fad433be87e5252f4b03850642f88993f7b2ca566"},
+    {file = "numpy-2.2.6-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f92729c95468a2f4f15e9bb94c432a9229d0d50de67304399627a943201baa2f"},
+    {file = "numpy-2.2.6-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:1bc23a79bfabc5d056d106f9befb8d50c31ced2fbc70eedb8155aec74a45798f"},
+    {file = "numpy-2.2.6-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:e3143e4451880bed956e706a3220b4e5cf6172ef05fcc397f6f36a550b1dd868"},
+    {file = "numpy-2.2.6-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:b4f13750ce79751586ae2eb824ba7e1e8dba64784086c98cdbbcc6a42112ce0d"},
+    {file = "numpy-2.2.6-cp313-cp313-win32.whl", hash = "sha256:5beb72339d9d4fa36522fc63802f469b13cdbe4fdab4a288f0c441b74272ebfd"},
+    {file = "numpy-2.2.6-cp313-cp313-win_amd64.whl", hash = "sha256:b0544343a702fa80c95ad5d3d608ea3599dd54d4632df855e4c8d24eb6ecfa1c"},
+    {file = "numpy-2.2.6-cp313-cp313t-macosx_10_13_x86_64.whl", hash = "sha256:0bca768cd85ae743b2affdc762d617eddf3bcf8724435498a1e80132d04879e6"},
+    {file = "numpy-2.2.6-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:fc0c5673685c508a142ca65209b4e79ed6740a4ed6b2267dbba90f34b0b3cfda"},
+    {file = "numpy-2.2.6-cp313-cp313t-macosx_14_0_arm64.whl", hash = "sha256:5bd4fc3ac8926b3819797a7c0e2631eb889b4118a9898c84f585a54d475b7e40"},
+    {file = "numpy-2.2.6-cp313-cp313t-macosx_14_0_x86_64.whl", hash = "sha256:fee4236c876c4e8369388054d02d0e9bb84821feb1a64dd59e137e6511a551f8"},
+    {file = "numpy-2.2.6-cp313-cp313t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:e1dda9c7e08dc141e0247a5b8f49cf05984955246a327d4c48bda16821947b2f"},
+    {file = "numpy-2.2.6-cp313-cp313t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:f447e6acb680fd307f40d3da4852208af94afdfab89cf850986c3ca00562f4fa"},
+    {file = "numpy-2.2.6-cp313-cp313t-musllinux_1_2_aarch64.whl", hash = "sha256:389d771b1623ec92636b0786bc4ae56abafad4a4c513d36a55dce14bd9ce8571"},
+    {file = "numpy-2.2.6-cp313-cp313t-musllinux_1_2_x86_64.whl", hash = "sha256:8e9ace4a37db23421249ed236fdcdd457d671e25146786dfc96835cd951aa7c1"},
+    {file = "numpy-2.2.6-cp313-cp313t-win32.whl", hash = "sha256:038613e9fb8c72b0a41f025a7e4c3f0b7a1b5d768ece4796b674c8f3fe13efff"},
+    {file = "numpy-2.2.6-cp313-cp313t-win_amd64.whl", hash = "sha256:6031dd6dfecc0cf9f668681a37648373bddd6421fff6c66ec1624eed0180ee06"},
+    {file = "numpy-2.2.6-pp310-pypy310_pp73-macosx_10_15_x86_64.whl", hash = "sha256:0b605b275d7bd0c640cad4e5d30fa701a8d59302e127e5f79138ad62762c3e3d"},
+    {file = "numpy-2.2.6-pp310-pypy310_pp73-macosx_14_0_x86_64.whl", hash = "sha256:7befc596a7dc9da8a337f79802ee8adb30a552a94f792b9c9d18c840055907db"},
+    {file = "numpy-2.2.6-pp310-pypy310_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:ce47521a4754c8f4593837384bd3424880629f718d87c5d44f8ed763edd63543"},
+    {file = "numpy-2.2.6-pp310-pypy310_pp73-win_amd64.whl", hash = "sha256:d042d24c90c41b54fd506da306759e06e568864df8ec17ccc17e9e884634fd00"},
+    {file = "numpy-2.2.6.tar.gz", hash = "sha256:e29554e2bef54a90aa5cc07da6ce955accb83f21ab5de01a62c8478897b264fd"},
+]
+
+[[package]]
+name = "numpy"
+version = "2.3.2"
+description = "Fundamental package for array computing in Python"
+optional = false
+python-versions = ">=3.11"
+groups = ["main"]
+markers = "python_version >= \"3.11\""
+files = [
+    {file = "numpy-2.3.2-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:852ae5bed3478b92f093e30f785c98e0cb62fa0a939ed057c31716e18a7a22b9"},
+    {file = "numpy-2.3.2-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:7a0e27186e781a69959d0230dd9909b5e26024f8da10683bd6344baea1885168"},
+    {file = "numpy-2.3.2-cp311-cp311-macosx_14_0_arm64.whl", hash = "sha256:f0a1a8476ad77a228e41619af2fa9505cf69df928e9aaa165746584ea17fed2b"},
+    {file = "numpy-2.3.2-cp311-cp311-macosx_14_0_x86_64.whl", hash = "sha256:cbc95b3813920145032412f7e33d12080f11dc776262df1712e1638207dde9e8"},
+    {file = "numpy-2.3.2-cp311-cp311-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:f75018be4980a7324edc5930fe39aa391d5734531b1926968605416ff58c332d"},
+    {file = "numpy-2.3.2-cp311-cp311-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:20b8200721840f5621b7bd03f8dcd78de33ec522fc40dc2641aa09537df010c3"},
+    {file = "numpy-2.3.2-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:1f91e5c028504660d606340a084db4b216567ded1056ea2b4be4f9d10b67197f"},
+    {file = "numpy-2.3.2-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:fb1752a3bb9a3ad2d6b090b88a9a0ae1cd6f004ef95f75825e2f382c183b2097"},
+    {file = "numpy-2.3.2-cp311-cp311-win32.whl", hash = "sha256:4ae6863868aaee2f57503c7a5052b3a2807cf7a3914475e637a0ecd366ced220"},
+    {file = "numpy-2.3.2-cp311-cp311-win_amd64.whl", hash = "sha256:240259d6564f1c65424bcd10f435145a7644a65a6811cfc3201c4a429ba79170"},
+    {file = "numpy-2.3.2-cp311-cp311-win_arm64.whl", hash = "sha256:4209f874d45f921bde2cff1ffcd8a3695f545ad2ffbef6d3d3c6768162efab89"},
+    {file = "numpy-2.3.2-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:bc3186bea41fae9d8e90c2b4fb5f0a1f5a690682da79b92574d63f56b529080b"},
+    {file = "numpy-2.3.2-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:2f4f0215edb189048a3c03bd5b19345bdfa7b45a7a6f72ae5945d2a28272727f"},
+    {file = "numpy-2.3.2-cp312-cp312-macosx_14_0_arm64.whl", hash = "sha256:8b1224a734cd509f70816455c3cffe13a4f599b1bf7130f913ba0e2c0b2006c0"},
+    {file = "numpy-2.3.2-cp312-cp312-macosx_14_0_x86_64.whl", hash = "sha256:3dcf02866b977a38ba3ec10215220609ab9667378a9e2150615673f3ffd6c73b"},
+    {file = "numpy-2.3.2-cp312-cp312-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:572d5512df5470f50ada8d1972c5f1082d9a0b7aa5944db8084077570cf98370"},
+    {file = "numpy-2.3.2-cp312-cp312-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:8145dd6d10df13c559d1e4314df29695613575183fa2e2d11fac4c208c8a1f73"},
+    {file = "numpy-2.3.2-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:103ea7063fa624af04a791c39f97070bf93b96d7af7eb23530cd087dc8dbe9dc"},
+    {file = "numpy-2.3.2-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:fc927d7f289d14f5e037be917539620603294454130b6de200091e23d27dc9be"},
+    {file = "numpy-2.3.2-cp312-cp312-win32.whl", hash = "sha256:d95f59afe7f808c103be692175008bab926b59309ade3e6d25009e9a171f7036"},
+    {file = "numpy-2.3.2-cp312-cp312-win_amd64.whl", hash = "sha256:9e196ade2400c0c737d93465327d1ae7c06c7cb8a1756121ebf54b06ca183c7f"},
+    {file = "numpy-2.3.2-cp312-cp312-win_arm64.whl", hash = "sha256:ee807923782faaf60d0d7331f5e86da7d5e3079e28b291973c545476c2b00d07"},
+    {file = "numpy-2.3.2-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:c8d9727f5316a256425892b043736d63e89ed15bbfe6556c5ff4d9d4448ff3b3"},
+    {file = "numpy-2.3.2-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:efc81393f25f14d11c9d161e46e6ee348637c0a1e8a54bf9dedc472a3fae993b"},
+    {file = "numpy-2.3.2-cp313-cp313-macosx_14_0_arm64.whl", hash = "sha256:dd937f088a2df683cbb79dda9a772b62a3e5a8a7e76690612c2737f38c6ef1b6"},
+    {file = "numpy-2.3.2-cp313-cp313-macosx_14_0_x86_64.whl", hash = "sha256:11e58218c0c46c80509186e460d79fbdc9ca1eb8d8aee39d8f2dc768eb781089"},
+    {file = "numpy-2.3.2-cp313-cp313-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:5ad4ebcb683a1f99f4f392cc522ee20a18b2bb12a2c1c42c3d48d5a1adc9d3d2"},
+    {file = "numpy-2.3.2-cp313-cp313-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:938065908d1d869c7d75d8ec45f735a034771c6ea07088867f713d1cd3bbbe4f"},
+    {file = "numpy-2.3.2-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:66459dccc65d8ec98cc7df61307b64bf9e08101f9598755d42d8ae65d9a7a6ee"},
+    {file = "numpy-2.3.2-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:a7af9ed2aa9ec5950daf05bb11abc4076a108bd3c7db9aa7251d5f107079b6a6"},
+    {file = "numpy-2.3.2-cp313-cp313-win32.whl", hash = "sha256:906a30249315f9c8e17b085cc5f87d3f369b35fedd0051d4a84686967bdbbd0b"},
+    {file = "numpy-2.3.2-cp313-cp313-win_amd64.whl", hash = "sha256:c63d95dc9d67b676e9108fe0d2182987ccb0f11933c1e8959f42fa0da8d4fa56"},
+    {file = "numpy-2.3.2-cp313-cp313-win_arm64.whl", hash = "sha256:b05a89f2fb84d21235f93de47129dd4f11c16f64c87c33f5e284e6a3a54e43f2"},
+    {file = "numpy-2.3.2-cp313-cp313t-macosx_10_13_x86_64.whl", hash = "sha256:4e6ecfeddfa83b02318f4d84acf15fbdbf9ded18e46989a15a8b6995dfbf85ab"},
+    {file = "numpy-2.3.2-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:508b0eada3eded10a3b55725b40806a4b855961040180028f52580c4729916a2"},
+    {file = "numpy-2.3.2-cp313-cp313t-macosx_14_0_arm64.whl", hash = "sha256:754d6755d9a7588bdc6ac47dc4ee97867271b17cee39cb87aef079574366db0a"},
+    {file = "numpy-2.3.2-cp313-cp313t-macosx_14_0_x86_64.whl", hash = "sha256:a9f66e7d2b2d7712410d3bc5684149040ef5f19856f20277cd17ea83e5006286"},
+    {file = "numpy-2.3.2-cp313-cp313t-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:de6ea4e5a65d5a90c7d286ddff2b87f3f4ad61faa3db8dabe936b34c2275b6f8"},
+    {file = "numpy-2.3.2-cp313-cp313t-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:a3ef07ec8cbc8fc9e369c8dcd52019510c12da4de81367d8b20bc692aa07573a"},
+    {file = "numpy-2.3.2-cp313-cp313t-musllinux_1_2_aarch64.whl", hash = "sha256:27c9f90e7481275c7800dc9c24b7cc40ace3fdb970ae4d21eaff983a32f70c91"},
+    {file = "numpy-2.3.2-cp313-cp313t-musllinux_1_2_x86_64.whl", hash = "sha256:07b62978075b67eee4065b166d000d457c82a1efe726cce608b9db9dd66a73a5"},
+    {file = "numpy-2.3.2-cp313-cp313t-win32.whl", hash = "sha256:c771cfac34a4f2c0de8e8c97312d07d64fd8f8ed45bc9f5726a7e947270152b5"},
+    {file = "numpy-2.3.2-cp313-cp313t-win_amd64.whl", hash = "sha256:72dbebb2dcc8305c431b2836bcc66af967df91be793d63a24e3d9b741374c450"},
+    {file = "numpy-2.3.2-cp313-cp313t-win_arm64.whl", hash = "sha256:72c6df2267e926a6d5286b0a6d556ebe49eae261062059317837fda12ddf0c1a"},
+    {file = "numpy-2.3.2-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:448a66d052d0cf14ce9865d159bfc403282c9bc7bb2a31b03cc18b651eca8b1a"},
+    {file = "numpy-2.3.2-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:546aaf78e81b4081b2eba1d105c3b34064783027a06b3ab20b6eba21fb64132b"},
+    {file = "numpy-2.3.2-cp314-cp314-macosx_14_0_arm64.whl", hash = "sha256:87c930d52f45df092f7578889711a0768094debf73cfcde105e2d66954358125"},
+    {file = "numpy-2.3.2-cp314-cp314-macosx_14_0_x86_64.whl", hash = "sha256:8dc082ea901a62edb8f59713c6a7e28a85daddcb67454c839de57656478f5b19"},
+    {file = "numpy-2.3.2-cp314-cp314-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:af58de8745f7fa9ca1c0c7c943616c6fe28e75d0c81f5c295810e3c83b5be92f"},
+    {file = "numpy-2.3.2-cp314-cp314-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:fed5527c4cf10f16c6d0b6bee1f89958bccb0ad2522c8cadc2efd318bcd545f5"},
+    {file = "numpy-2.3.2-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:095737ed986e00393ec18ec0b21b47c22889ae4b0cd2d5e88342e08b01141f58"},
+    {file = "numpy-2.3.2-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:b5e40e80299607f597e1a8a247ff8d71d79c5b52baa11cc1cce30aa92d2da6e0"},
+    {file = "numpy-2.3.2-cp314-cp314-win32.whl", hash = "sha256:7d6e390423cc1f76e1b8108c9b6889d20a7a1f59d9a60cac4a050fa734d6c1e2"},
+    {file = "numpy-2.3.2-cp314-cp314-win_amd64.whl", hash = "sha256:b9d0878b21e3918d76d2209c924ebb272340da1fb51abc00f986c258cd5e957b"},
+    {file = "numpy-2.3.2-cp314-cp314-win_arm64.whl", hash = "sha256:2738534837c6a1d0c39340a190177d7d66fdf432894f469728da901f8f6dc910"},
+    {file = "numpy-2.3.2-cp314-cp314t-macosx_10_13_x86_64.whl", hash = "sha256:4d002ecf7c9b53240be3bb69d80f86ddbd34078bae04d87be81c1f58466f264e"},
+    {file = "numpy-2.3.2-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:293b2192c6bcce487dbc6326de5853787f870aeb6c43f8f9c6496db5b1781e45"},
+    {file = "numpy-2.3.2-cp314-cp314t-macosx_14_0_arm64.whl", hash = "sha256:0a4f2021a6da53a0d580d6ef5db29947025ae8b35b3250141805ea9a32bbe86b"},
+    {file = "numpy-2.3.2-cp314-cp314t-macosx_14_0_x86_64.whl", hash = "sha256:9c144440db4bf3bb6372d2c3e49834cc0ff7bb4c24975ab33e01199e645416f2"},
+    {file = "numpy-2.3.2-cp314-cp314t-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:f92d6c2a8535dc4fe4419562294ff957f83a16ebdec66df0805e473ffaad8bd0"},
+    {file = "numpy-2.3.2-cp314-cp314t-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:cefc2219baa48e468e3db7e706305fcd0c095534a192a08f31e98d83a7d45fb0"},
+    {file = "numpy-2.3.2-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:76c3e9501ceb50b2ff3824c3589d5d1ab4ac857b0ee3f8f49629d0de55ecf7c2"},
+    {file = "numpy-2.3.2-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:122bf5ed9a0221b3419672493878ba4967121514b1d7d4656a7580cd11dddcbf"},
+    {file = "numpy-2.3.2-cp314-cp314t-win32.whl", hash = "sha256:6f1ae3dcb840edccc45af496f312528c15b1f79ac318169d094e85e4bb35fdf1"},
+    {file = "numpy-2.3.2-cp314-cp314t-win_amd64.whl", hash = "sha256:087ffc25890d89a43536f75c5fe8770922008758e8eeeef61733957041ed2f9b"},
+    {file = "numpy-2.3.2-cp314-cp314t-win_arm64.whl", hash = "sha256:092aeb3449833ea9c0bf0089d70c29ae480685dd2377ec9cdbbb620257f84631"},
+    {file = "numpy-2.3.2-pp311-pypy311_pp73-macosx_10_15_x86_64.whl", hash = "sha256:14a91ebac98813a49bc6aa1a0dfc09513dcec1d97eaf31ca21a87221a1cdcb15"},
+    {file = "numpy-2.3.2-pp311-pypy311_pp73-macosx_11_0_arm64.whl", hash = "sha256:71669b5daae692189540cffc4c439468d35a3f84f0c88b078ecd94337f6cb0ec"},
+    {file = "numpy-2.3.2-pp311-pypy311_pp73-macosx_14_0_arm64.whl", hash = "sha256:69779198d9caee6e547adb933941ed7520f896fd9656834c300bdf4dd8642712"},
+    {file = "numpy-2.3.2-pp311-pypy311_pp73-macosx_14_0_x86_64.whl", hash = "sha256:2c3271cc4097beb5a60f010bcc1cc204b300bb3eafb4399376418a83a1c6373c"},
+    {file = "numpy-2.3.2-pp311-pypy311_pp73-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:8446acd11fe3dc1830568c941d44449fd5cb83068e5c70bd5a470d323d448296"},
+    {file = "numpy-2.3.2-pp311-pypy311_pp73-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:aa098a5ab53fa407fded5870865c6275a5cd4101cfdef8d6fafc48286a96e981"},
+    {file = "numpy-2.3.2-pp311-pypy311_pp73-win_amd64.whl", hash = "sha256:6936aff90dda378c09bea075af0d9c675fe3a977a9d2402f95a87f440f59f619"},
+    {file = "numpy-2.3.2.tar.gz", hash = "sha256:e0486a11ec30cdecb53f184d496d1c6a20786c81e55e41640270130056f8ee48"},
+]
+
+[[package]]
+name = "packaging"
+version = "25.0"
+description = "Core utilities for Python packages"
+optional = false
+python-versions = ">=3.8"
+groups = ["main"]
+files = [
+    {file = "packaging-25.0-py3-none-any.whl", hash = "sha256:29572ef2b1f17581046b3a2227d5c611fb25ec70ca1ba8554b24b0e69331a484"},
+    {file = "packaging-25.0.tar.gz", hash = "sha256:d443872c98d677bf60f6a1f2f8c1cb748e8fe762d2bf9d3148b5599295b0fc4f"},
+]
+
+[[package]]
+name = "pandas"
+version = "2.3.2"
+description = "Powerful data structures for data analysis, time series, and statistics"
+optional = false
+python-versions = ">=3.9"
+groups = ["main"]
+files = [
+    {file = "pandas-2.3.2-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:52bc29a946304c360561974c6542d1dd628ddafa69134a7131fdfd6a5d7a1a35"},
+    {file = "pandas-2.3.2-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:220cc5c35ffaa764dd5bb17cf42df283b5cb7fdf49e10a7b053a06c9cb48ee2b"},
+    {file = "pandas-2.3.2-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:42c05e15111221384019897df20c6fe893b2f697d03c811ee67ec9e0bb5a3424"},
+    {file = "pandas-2.3.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:cc03acc273c5515ab69f898df99d9d4f12c4d70dbfc24c3acc6203751d0804cf"},
+    {file = "pandas-2.3.2-cp310-cp310-musllinux_1_2_aarch64.whl", hash = "sha256:d25c20a03e8870f6339bcf67281b946bd20b86f1a544ebbebb87e66a8d642cba"},
+    {file = "pandas-2.3.2-cp310-cp310-musllinux_1_2_x86_64.whl", hash = "sha256:21bb612d148bb5860b7eb2c10faacf1a810799245afd342cf297d7551513fbb6"},
+    {file = "pandas-2.3.2-cp310-cp310-win_amd64.whl", hash = "sha256:b62d586eb25cb8cb70a5746a378fc3194cb7f11ea77170d59f889f5dfe3cec7a"},
+    {file = "pandas-2.3.2-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:1333e9c299adcbb68ee89a9bb568fc3f20f9cbb419f1dd5225071e6cddb2a743"},
+    {file = "pandas-2.3.2-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:76972bcbd7de8e91ad5f0ca884a9f2c477a2125354af624e022c49e5bd0dfff4"},
+    {file = "pandas-2.3.2-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:b98bdd7c456a05eef7cd21fd6b29e3ca243591fe531c62be94a2cc987efb5ac2"},
+    {file = "pandas-2.3.2-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:1d81573b3f7db40d020983f78721e9bfc425f411e616ef019a10ebf597aedb2e"},
+    {file = "pandas-2.3.2-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:e190b738675a73b581736cc8ec71ae113d6c3768d0bd18bffa5b9a0927b0b6ea"},
+    {file = "pandas-2.3.2-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:c253828cb08f47488d60f43c5fc95114c771bbfff085da54bfc79cb4f9e3a372"},
+    {file = "pandas-2.3.2-cp311-cp311-win_amd64.whl", hash = "sha256:9467697b8083f9667b212633ad6aa4ab32436dcbaf4cd57325debb0ddef2012f"},
+    {file = "pandas-2.3.2-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:3fbb977f802156e7a3f829e9d1d5398f6192375a3e2d1a9ee0803e35fe70a2b9"},
+    {file = "pandas-2.3.2-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:1b9b52693123dd234b7c985c68b709b0b009f4521000d0525f2b95c22f15944b"},
+    {file = "pandas-2.3.2-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:0bd281310d4f412733f319a5bc552f86d62cddc5f51d2e392c8787335c994175"},
+    {file = "pandas-2.3.2-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:96d31a6b4354e3b9b8a2c848af75d31da390657e3ac6f30c05c82068b9ed79b9"},
+    {file = "pandas-2.3.2-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:df4df0b9d02bb873a106971bb85d448378ef14b86ba96f035f50bbd3688456b4"},
+    {file = "pandas-2.3.2-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:213a5adf93d020b74327cb2c1b842884dbdd37f895f42dcc2f09d451d949f811"},
+    {file = "pandas-2.3.2-cp312-cp312-win_amd64.whl", hash = "sha256:8c13b81a9347eb8c7548f53fd9a4f08d4dfe996836543f805c987bafa03317ae"},
+    {file = "pandas-2.3.2-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:0c6ecbac99a354a051ef21c5307601093cb9e0f4b1855984a084bfec9302699e"},
+    {file = "pandas-2.3.2-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:c6f048aa0fd080d6a06cc7e7537c09b53be6642d330ac6f54a600c3ace857ee9"},
+    {file = "pandas-2.3.2-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:0064187b80a5be6f2f9c9d6bdde29372468751dfa89f4211a3c5871854cfbf7a"},
+    {file = "pandas-2.3.2-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:4ac8c320bded4718b298281339c1a50fb00a6ba78cb2a63521c39bec95b0209b"},
+    {file = "pandas-2.3.2-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:114c2fe4f4328cf98ce5716d1532f3ab79c5919f95a9cfee81d9140064a2e4d6"},
+    {file = "pandas-2.3.2-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:48fa91c4dfb3b2b9bfdb5c24cd3567575f4e13f9636810462ffed8925352be5a"},
+    {file = "pandas-2.3.2-cp313-cp313-win_amd64.whl", hash = "sha256:12d039facec710f7ba305786837d0225a3444af7bbd9c15c32ca2d40d157ed8b"},
+    {file = "pandas-2.3.2-cp313-cp313t-macosx_10_13_x86_64.whl", hash = "sha256:c624b615ce97864eb588779ed4046186f967374185c047070545253a52ab2d57"},
+    {file = "pandas-2.3.2-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:0cee69d583b9b128823d9514171cabb6861e09409af805b54459bd0c821a35c2"},
+    {file = "pandas-2.3.2-cp313-cp313t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:2319656ed81124982900b4c37f0e0c58c015af9a7bbc62342ba5ad07ace82ba9"},
+    {file = "pandas-2.3.2-cp313-cp313t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:b37205ad6f00d52f16b6d09f406434ba928c1a1966e2771006a9033c736d30d2"},
+    {file = "pandas-2.3.2-cp313-cp313t-musllinux_1_2_aarch64.whl", hash = "sha256:837248b4fc3a9b83b9c6214699a13f069dc13510a6a6d7f9ba33145d2841a012"},
+    {file = "pandas-2.3.2-cp313-cp313t-musllinux_1_2_x86_64.whl", hash = "sha256:d2c3554bd31b731cd6490d94a28f3abb8dd770634a9e06eb6d2911b9827db370"},
+    {file = "pandas-2.3.2-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:88080a0ff8a55eac9c84e3ff3c7665b3b5476c6fbc484775ca1910ce1c3e0b87"},
+    {file = "pandas-2.3.2-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:d4a558c7620340a0931828d8065688b3cc5b4c8eb674bcaf33d18ff4a6870b4a"},
+    {file = "pandas-2.3.2-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:45178cf09d1858a1509dc73ec261bf5b25a625a389b65be2e47b559905f0ab6a"},
+    {file = "pandas-2.3.2-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:77cefe00e1b210f9c76c697fedd8fdb8d3dd86563e9c8adc9fa72b90f5e9e4c2"},
+    {file = "pandas-2.3.2-cp39-cp39-musllinux_1_2_aarch64.whl", hash = "sha256:13bd629c653856f00c53dc495191baa59bcafbbf54860a46ecc50d3a88421a96"},
+    {file = "pandas-2.3.2-cp39-cp39-musllinux_1_2_x86_64.whl", hash = "sha256:36d627906fd44b5fd63c943264e11e96e923f8de77d6016dc2f667b9ad193438"},
+    {file = "pandas-2.3.2-cp39-cp39-win_amd64.whl", hash = "sha256:a9d7ec92d71a420185dec44909c32e9a362248c4ae2238234b76d5be37f208cc"},
+    {file = "pandas-2.3.2.tar.gz", hash = "sha256:ab7b58f8f82706890924ccdfb5f48002b83d2b5a3845976a9fb705d36c34dcdb"},
+]
+
+[package.dependencies]
+numpy = [
+    {version = ">=1.22.4", markers = "python_version < \"3.11\""},
+    {version = ">=1.23.2", markers = "python_version == \"3.11\""},
+    {version = ">=1.26.0", markers = "python_version >= \"3.12\""},
+]
+python-dateutil = ">=2.8.2"
+pytz = ">=2020.1"
+tzdata = ">=2022.7"
+
+[package.extras]
+all = ["PyQt5 (>=5.15.9)", "SQLAlchemy (>=2.0.0)", "adbc-driver-postgresql (>=0.8.0)", "adbc-driver-sqlite (>=0.8.0)", "beautifulsoup4 (>=4.11.2)", "bottleneck (>=1.3.6)", "dataframe-api-compat (>=0.1.7)", "fastparquet (>=2022.12.0)", "fsspec (>=2022.11.0)", "gcsfs (>=2022.11.0)", "html5lib (>=1.1)", "hypothesis (>=6.46.1)", "jinja2 (>=3.1.2)", "lxml (>=4.9.2)", "matplotlib (>=3.6.3)", "numba (>=0.56.4)", "numexpr (>=2.8.4)", "odfpy (>=1.4.1)", "openpyxl (>=3.1.0)", "pandas-gbq (>=0.19.0)", "psycopg2 (>=2.9.6)", "pyarrow (>=10.0.1)", "pymysql (>=1.0.2)", "pyreadstat (>=1.2.0)", "pytest (>=7.3.2)", "pytest-xdist (>=2.2.0)", "python-calamine (>=0.1.7)", "pyxlsb (>=1.0.10)", "qtpy (>=2.3.0)", "s3fs (>=2022.11.0)", "scipy (>=1.10.0)", "tables (>=3.8.0)", "tabulate (>=0.9.0)", "xarray (>=2022.12.0)", "xlrd (>=2.0.1)", "xlsxwriter (>=3.0.5)", "zstandard (>=0.19.0)"]
+aws = ["s3fs (>=2022.11.0)"]
+clipboard = ["PyQt5 (>=5.15.9)", "qtpy (>=2.3.0)"]
+compression = ["zstandard (>=0.19.0)"]
+computation = ["scipy (>=1.10.0)", "xarray (>=2022.12.0)"]
+consortium-standard = ["dataframe-api-compat (>=0.1.7)"]
+excel = ["odfpy (>=1.4.1)", "openpyxl (>=3.1.0)", "python-calamine (>=0.1.7)", "pyxlsb (>=1.0.10)", "xlrd (>=2.0.1)", "xlsxwriter (>=3.0.5)"]
+feather = ["pyarrow (>=10.0.1)"]
+fss = ["fsspec (>=2022.11.0)"]
+gcp = ["gcsfs (>=2022.11.0)", "pandas-gbq (>=0.19.0)"]
+hdf5 = ["tables (>=3.8.0)"]
+html = ["beautifulsoup4 (>=4.11.2)", "html5lib (>=1.1)", "lxml (>=4.9.2)"]
+mysql = ["SQLAlchemy (>=2.0.0)", "pymysql (>=1.0.2)"]
+output-formatting = ["jinja2 (>=3.1.2)", "tabulate (>=0.9.0)"]
+parquet = ["pyarrow (>=10.0.1)"]
+performance = ["bottleneck (>=1.3.6)", "numba (>=0.56.4)", "numexpr (>=2.8.4)"]
+plot = ["matplotlib (>=3.6.3)"]
+postgresql = ["SQLAlchemy (>=2.0.0)", "adbc-driver-postgresql (>=0.8.0)", "psycopg2 (>=2.9.6)"]
+pyarrow = ["pyarrow (>=10.0.1)"]
+spss = ["pyreadstat (>=1.2.0)"]
+sql-other = ["SQLAlchemy (>=2.0.0)", "adbc-driver-postgresql (>=0.8.0)", "adbc-driver-sqlite (>=0.8.0)"]
+test = ["hypothesis (>=6.46.1)", "pytest (>=7.3.2)", "pytest-xdist (>=2.2.0)"]
+xml = ["lxml (>=4.9.2)"]
+
+[[package]]
+name = "plotly"
+version = "5.24.1"
+description = "An open-source, interactive data visualization library for Python"
+optional = false
+python-versions = ">=3.8"
+groups = ["main"]
+files = [
+    {file = "plotly-5.24.1-py3-none-any.whl", hash = "sha256:f67073a1e637eb0dc3e46324d9d51e2fe76e9727c892dde64ddf1e1b51f29089"},
+    {file = "plotly-5.24.1.tar.gz", hash = "sha256:dbc8ac8339d248a4bcc36e08a5659bacfe1b079390b8953533f4eb22169b4bae"},
+]
+
+[package.dependencies]
+packaging = "*"
+tenacity = ">=6.2.0"
+
+[[package]]
+name = "python-dateutil"
+version = "2.9.0.post0"
+description = "Extensions to the standard Python datetime module"
+optional = false
+python-versions = "!=3.0.*,!=3.1.*,!=3.2.*,>=2.7"
+groups = ["main"]
+files = [
+    {file = "python-dateutil-2.9.0.post0.tar.gz", hash = "sha256:37dd54208da7e1cd875388217d5e00ebd4179249f90fb72437e91a35459a0ad3"},
+    {file = "python_dateutil-2.9.0.post0-py2.py3-none-any.whl", hash = "sha256:a8b2bc7bffae282281c8140a97d3aa9c14da0b136dfe83f850eea9a5f7470427"},
+]
+
+[package.dependencies]
+six = ">=1.5"
+
+[[package]]
+name = "pytz"
+version = "2025.2"
+description = "World timezone definitions, modern and historical"
+optional = false
+python-versions = "*"
+groups = ["main"]
+files = [
+    {file = "pytz-2025.2-py2.py3-none-any.whl", hash = "sha256:5ddf76296dd8c44c26eb8f4b6f35488f3ccbf6fbbd7adee0b7262d43f0ec2f00"},
+    {file = "pytz-2025.2.tar.gz", hash = "sha256:360b9e3dbb49a209c21ad61809c7fb453643e048b38924c765813546746e81c3"},
+]
+
+[[package]]
+name = "requests"
+version = "2.32.5"
+description = "Python HTTP for Humans."
+optional = false
+python-versions = ">=3.9"
+groups = ["main"]
+files = [
+    {file = "requests-2.32.5-py3-none-any.whl", hash = "sha256:2462f94637a34fd532264295e186976db0f5d453d1cdd31473c85a6a161affb6"},
+    {file = "requests-2.32.5.tar.gz", hash = "sha256:dbba0bac56e100853db0ea71b82b4dfd5fe2bf6d3754a8893c3af500cec7d7cf"},
+]
+
+[package.dependencies]
+certifi = ">=2017.4.17"
+charset_normalizer = ">=2,<4"
+idna = ">=2.5,<4"
+urllib3 = ">=1.21.1,<3"
+
+[package.extras]
+socks = ["PySocks (>=1.5.6,!=1.5.7)"]
+use-chardet-on-py3 = ["chardet (>=3.0.2,<6)"]
+
+[[package]]
+name = "six"
+version = "1.17.0"
+description = "Python 2 and 3 compatibility utilities"
+optional = false
+python-versions = "!=3.0.*,!=3.1.*,!=3.2.*,>=2.7"
+groups = ["main"]
+files = [
+    {file = "six-1.17.0-py2.py3-none-any.whl", hash = "sha256:4721f391ed90541fddacab5acf947aa0d3dc7d27b2e1e8eda2be8970586c3274"},
+    {file = "six-1.17.0.tar.gz", hash = "sha256:ff70335d468e7eb6ec65b95b99d3a2836546063f63acc5171de367e834932a81"},
+]
+
+[[package]]
+name = "tenacity"
+version = "9.1.2"
+description = "Retry code until it succeeds"
+optional = false
+python-versions = ">=3.9"
+groups = ["main"]
+files = [
+    {file = "tenacity-9.1.2-py3-none-any.whl", hash = "sha256:f77bf36710d8b73a50b2dd155c97b870017ad21afe6ab300326b0371b3b05138"},
+    {file = "tenacity-9.1.2.tar.gz", hash = "sha256:1169d376c297e7de388d18b4481760d478b0e99a777cad3a9c86e556f4b697cb"},
+]
+
+[package.extras]
+doc = ["reno", "sphinx"]
+test = ["pytest", "tornado (>=4.5)", "typeguard"]
+
+[[package]]
+name = "tzdata"
+version = "2025.2"
+description = "Provider of IANA time zone data"
+optional = false
+python-versions = ">=2"
+groups = ["main"]
+files = [
+    {file = "tzdata-2025.2-py2.py3-none-any.whl", hash = "sha256:1a403fada01ff9221ca8044d701868fa132215d84beb92242d9acd2147f667a8"},
+    {file = "tzdata-2025.2.tar.gz", hash = "sha256:b60a638fcc0daffadf82fe0f57e53d06bdec2f36c4df66280ae79bce6bd6f2b9"},
+]
+
+[[package]]
+name = "urllib3"
+version = "2.5.0"
+description = "HTTP library with thread-safe connection pooling, file post, and more."
+optional = false
+python-versions = ">=3.9"
+groups = ["main"]
+files = [
+    {file = "urllib3-2.5.0-py3-none-any.whl", hash = "sha256:e6b01673c0fa6a13e374b50871808eb3bf7046c4b125b216f6bf1cc604cff0dc"},
+    {file = "urllib3-2.5.0.tar.gz", hash = "sha256:3fc47733c7e419d4bc3f6b3dc2b4f890bb743906a30d56ba4a5bfa4bbff92760"},
+]
+
+[package.extras]
+brotli = ["brotli (>=1.0.9) ; platform_python_implementation == \"CPython\"", "brotlicffi (>=0.8.0) ; platform_python_implementation != \"CPython\""]
+h2 = ["h2 (>=4,<5)"]
+socks = ["pysocks (>=1.5.6,!=1.5.7,<2.0)"]
+zstd = ["zstandard (>=0.18.0)"]
+
+[metadata]
+lock-version = "2.1"
+python-versions = ">=3.10,<3.13"
+content-hash = "a7f64c43efcba78952701498a72a8fe503e995841717b2d5de4c9aa20c9a996a"
diff --git a/app/src/content/embeds/original_embeds/plotly/pyproject.toml b/app/src/content/embeds/original_embeds/plotly/pyproject.toml
new file mode 100644
index 0000000000000000000000000000000000000000..2c020f06dbed2c5d70596f65de09d943de4b100b
--- /dev/null
+++ b/app/src/content/embeds/original_embeds/plotly/pyproject.toml
@@ -0,0 +1,20 @@
+[tool.poetry]
+name = "blogpost-fine-tasks-python"
+version = "0.1.0"
+description = "Plotly fragment generation scripts and HTML/Markdown conversions for the blogpost."
+package-mode = false
+
+[tool.poetry.dependencies]
+python = ">=3.10,<3.13"
+Markdown = "^3.6"
+requests = "^2.32.3"
+numpy = "^2.0.0"
+pandas = "^2.2.2"
+plotly = "^5.24.0"
+
+[tool.poetry.scripts]
+html-to-md = "convert_to_md:main"
+
+[build-system]
+requires = ["poetry-core>=1.5.0"]
+build-backend = "poetry.core.masonry.api"
diff --git a/app/src/content/embeds/plotly-line.html b/app/src/content/embeds/plotly-line.html
new file mode 100644
index 0000000000000000000000000000000000000000..91056f958235aea35d9731272a508f8eed2e7add
--- /dev/null
+++ b/app/src/content/embeds/plotly-line.html
@@ -0,0 +1,84 @@
+
+<div id="line-ex-container-647b18ba">
+  <div>                            <div id="eacb4be4-822f-4675-a895-0b35bcfd8805" class="plotly-graph-div" style="height:100%; width:100%;"></div>            <script type="text/javascript">                                    window.PLOTLYENV=window.PLOTLYENV || {};                                    if (document.getElementById("eacb4be4-822f-4675-a895-0b35bcfd8805")) {                    Plotly.newPlot(                        "eacb4be4-822f-4675-a895-0b35bcfd8805",                        [{"hovertemplate":"\u003cb\u003e%{fullData.name}\u003c\u002fb\u003e\u003cbr\u003ex=%{x:.2f}\u003cbr\u003ey=%{y:.3f}\u003cextra\u003e\u003c\u002fextra\u003e","line":{"color":"#64748b","shape":"spline","smoothing":0.6,"width":2},"mode":"lines","name":"Baseline","showlegend":true,"x":[0.0,0.0041841004184100415,0.008368200836820083,0.012552301255230124,0.016736401673640166,0.02092050209205021,0.025104602510460247,0.02928870292887029,0.03347280334728033,0.03765690376569037,0.04184100418410042,0.046025104602510455,0.050209205020920494,0.05439330543933054,0.05857740585774058,0.06276150627615062,0.06694560669456066,0.0711297071129707,0.07531380753138074,0.0794979079497908,0.08368200836820083,0.08786610878661087,0.09205020920502091,0.09623430962343095,0.10041841004184099,0.10460251046025104,0.10878661087866108,0.11297071129707112,0.11715481171548116,0.1213389121338912,0.12552301255230125,0.12970711297071127,0.13389121338912133,0.13807531380753138,0.1422594142259414,0.14644351464435146,0.15062761506276148,0.15481171548117154,0.1589958158995816,0.1631799163179916,0.16736401673640167,0.1715481171548117,0.17573221757322174,0.1799163179916318,0.18410041841004182,0.18828451882845187,0.1924686192468619,0.19665271966527195,0.20083682008368198,0.20502092050209203,0.20920502092050208,0.2133891213389121,0.21757322175732216,0.22175732217573219,0.22594142259414224,0.2301255230125523,0.23430962343096232,0.23849372384937237,0.2426778242677824,0.24686192468619245,0.2510460251046025,0.25523012552301255,0.25941422594142255,0.2635983263598326,0.26778242677824265,0.2719665271966527,0.27615062761506276,0.28033472803347276,0.2845188284518828,0.28870292887029286,0.2928870292887029,0.29707112970711297,0.30125523012552297,0.305439330543933,0.30962343096234307,0.3138075313807531,0.3179916317991632,0.3221757322175732,0.3263598326359832,0.3305439330543933,0.33472803347280333,0.3389121338912134,0.3430962343096234,0.34728033472803344,0.3514644351464435,0.35564853556485354,0.3598326359832636,0.3640167364016736,0.36820083682008364,0.3723849372384937,0.37656903765690375,0.3807531380753138,0.3849372384937238,0.38912133891213385,0.3933054393305439,0.39748953974895396,0.40167364016736395,0.405857740585774,0.41004184100418406,0.4142259414225941,0.41841004184100417,0.42259414225941416,0.4267782426778242,0.43096234309623427,0.4351464435146443,0.4393305439330544,0.44351464435146437,0.4476987447698744,0.4518828451882845,0.45606694560669453,0.4602510460251046,0.4644351464435146,0.46861924686192463,0.4728033472803347,0.47698744769874474,0.4811715481171548,0.4853556485355648,0.48953974895397484,0.4937238493723849,0.49790794979079495,0.502092050209205,0.506276150627615,0.5104602510460251,0.5146443514644351,0.5188284518828451,0.5230125523012552,0.5271966527196652,0.5313807531380753,0.5355648535564853,0.5397489539748953,0.5439330543933054,0.5481171548117154,0.5523012552301255,0.5564853556485355,0.5606694560669455,0.5648535564853556,0.5690376569037656,0.5732217573221757,0.5774058577405857,0.5815899581589957,0.5857740585774058,0.5899581589958158,0.5941422594142259,0.5983263598326359,0.6025104602510459,0.606694560669456,0.610878661087866,0.6150627615062761,0.6192468619246861,0.6234309623430961,0.6276150627615062,0.6317991631799162,0.6359832635983264,0.6401673640167364,0.6443514644351463,0.6485355648535565,0.6527196652719665,0.6569037656903766,0.6610878661087866,0.6652719665271966,0.6694560669456067,0.6736401673640167,0.6778242677824268,0.6820083682008368,0.6861924686192468,0.6903765690376569,0.6945606694560669,0.698744769874477,0.702928870292887,0.707112970711297,0.7112970711297071,0.7154811715481171,0.7196652719665272,0.7238493723849372,0.7280334728033472,0.7322175732217573,0.7364016736401673,0.7405857740585774,0.7447698744769874,0.7489539748953974,0.7531380753138075,0.7573221757322175,0.7615062761506276,0.7656903765690376,0.7698744769874476,0.7740585774058577,0.7782426778242677,0.7824267782426778,0.7866108786610878,0.7907949790794978,0.7949790794979079,0.7991631799163179,0.8033472803347279,0.807531380753138,0.811715481171548,0.8158995815899581,0.8200836820083681,0.8242677824267781,0.8284518828451882,0.8326359832635982,0.8368200836820083,0.8410041841004183,0.8451882845188283,0.8493723849372384,0.8535564853556484,0.8577405857740585,0.8619246861924685,0.8661087866108785,0.8702928870292886,0.8744769874476986,0.8786610878661087,0.8828451882845187,0.8870292887029287,0.8912133891213389,0.8953974895397488,0.899581589958159,0.903765690376569,0.907949790794979,0.9121338912133891,0.9163179916317991,0.9205020920502092,0.9246861924686192,0.9288702928870292,0.9330543933054393,0.9372384937238493,0.9414225941422594,0.9456066945606694,0.9497907949790794,0.9539748953974895,0.9581589958158995,0.9623430962343096,0.9665271966527196,0.9707112970711296,0.9748953974895397,0.9790794979079497,0.9832635983263598,0.9874476987447698,0.9916317991631798,0.9958158995815899,1.0],"y":[0.10325611017271691,0.10339464908070704,0.1035390562715586,0.10368957804184283,0.10384647082790888,0.10401000160614818,0.10418044830755235,0.10435810024693962,0.10454325856722096,0.1047362366990729,0.10493736083637589,0.10514697042776965,0.10536541868466405,0.10559307310603182,0.10583031602029194,0.10607754514457322,0.10633517416162493,0.10660363331461449,0.10688337002002223,0.10717484949880761,0.10747855542598257,0.10779499059868251,0.10812467762277514,0.1084681596179913,0.10882600094149918,0.10919878792977272,0.10958712965852876,0.10999165872042038,0.11041303202008067,0.11085193158600631,0.11130906539865677,0.11178516823401995,0.11228100252175863,0.1127973592169032,0.11333505868389485,0.11389495159160672,0.114477919817781,0.11508487736111359,0.11571677125899543,0.11637458250868019,0.11705932698939046,0.117772056382598,0.11851385908741732,0.1192858611277356,0.12008922704736441,0.12092516078913879,0.1217949065535085,0.12269974963176174,0.12364101720859388,0.1246200791282849,0.12563834861827425,0.12669728296342733,0.12779838412376887,0.12894319928791798,0.1301333213539018,0.13137038932844328,0.13265608863522507,0.13399215132202053,0.13538035615596092,0.13682252859557953,0.13832054062763832,0.1398763104561116,0.14149180203007444,0.1431690243966304,0.14491003086442047,0.14671691796269073,0.14859182418036831,0.15053692846911637,0.15255444849391867,0.15464663861439287,0.1568157875797699,0.15906421592030787,0.1613942730178593,0.16380833383839039,0.16630879530947795,0.1688980723262078,0.17157859336947684,0.17435279572149145,0.1772231202642655,0.18019200584818182,0.18326188321920467,0.18643516849514025,0.1897142561834541,0.1931015117355877,0.19659926363548103,0.2002097950231238,0.2039353348574255,0.207778048626525,0.21174002861785352,0.21582328376481186,0.22002972909182084,0.22436117478472664,0.2288193149190735,0.23340571588455722,0.23812180455000417,0.24296885621943393,0.24794798243609284,0.2530601186977304,0.25830601215274074,0.2636862093530299,0.26920104414548673,0.2748506257896357,0.28063482739431467,0.28655327477093173,0.2926053358048954,0.29879011045004616,0.30510642145323597,0.31155280591747114,0.31812750781214627,0.3248284715377472,0.3316533366498935,0.3385994338436497,0.3456637822936055,0.3528430884382674,0.36013374628881456,0.36753183933226063,0.37503314408758337,0.38263313536051513,0.3903269932285346,0.3981096117723113,0.405975609553604,0.4139193418225966,0.42193491442011344,0.43001619932232193,0.4381568517577029,0.446350328808488,0.454589909391767,0.4628687154993053,0.4711797345600831,0.47951584277594816,0.48786982926879496,0.4962344208675833,0.504602307355484,0.5129661669916019,0.5213186921182653,0.5296526146637606,0.5379607313517324,0.5462359284321939,0.5544712057551259,0.5626597000159065,0.5707947070120986,0.5788697027632768,0.586878363359353,0.5948145834180083,0.6026724930481002,0.6104464732329847,0.6181311695653043,0.6257215042826447,0.6332126865712656,0.6406002211226275,0.6478799149443696,0.6550478824435727,0.6621005488153135,0.6690346517835489,0.6758472417541074,0.6825356804508947,0.6890976381162865,0.6955310893650131,0.7018343077876497,0.7080058594051007,0.7140445950792645,0.7199496419874267,0.72572039426896,0.7313565029526626,0.7368578652717028,0.7422246134707049,0.7474571032062077,0.7525559016376057,0.7575217753009073,0.7623556778523443,0.7670587377631131,0.7716322460404988,0.7760776440443701,0.7803965114616772,0.7845905544952088,0.7886615943165318,0.7926115558268515,0.7964424567635111,0.8001563971840802,0.8037555493544745,0.8072421480623625,0.810618481372249,0.813886881834114,0.8170497181533275,0.8201093873257699,0.8230683072386488,0.8259289097344318,0.8286936341325762,0.8313649212013411,0.833945207569883,0.836436920569059,0.8388424734878631,0.8411642612311867,0.8434046563636076,0.8455660055231439,0.8476506261883461,0.8496608037817258,0.8515987890923044,0.8534667959999981,0.8552669994846239,0.8570015339024812,0.8586724915137435,0.8602819212442462,0.8618318276656909,0.8633241701787625,0.8647608623841947,0.8661437716273805,0.8674747187027282,0.8687554777045662,0.869987776012039,0.8711732943960615,0.8723136672370364,0.8734104828426641,0.874465283855802,0.8754795677429297,0.8764547873543801,0.8773923515480664,0.8782936258689954,0.8791599332773964,0.8799925549188086,0.8807927309299669,0.8815616612747921,0.8823005066052454,0.8830103891422267,0.8836923935721009,0.8843475679548162,0.8849769246399327,0.8855814411872175,0.8861620612887775,0.8867196956899914,0.8872552231067824,0.8877694911370229,0.8882633171641062,0.888737489250938,0.889192767022802,0.8896298825377497,0.8900495411433326,0.8904524223186584,0.8908391805009009,0.8912104458955256],"type":"scatter"},{"hovertemplate":"\u003cb\u003e%{fullData.name}\u003c\u002fb\u003e\u003cbr\u003ex=%{x:.2f}\u003cbr\u003ey=%{y:.3f}\u003cextra\u003e\u003c\u002fextra\u003e","line":{"color":"#F981D4","shape":"spline","smoothing":0.6,"width":2},"mode":"lines","name":"Improved","showlegend":true,"x":[0.0,0.0041841004184100415,0.008368200836820083,0.012552301255230124,0.016736401673640166,0.02092050209205021,0.025104602510460247,0.02928870292887029,0.03347280334728033,0.03765690376569037,0.04184100418410042,0.046025104602510455,0.050209205020920494,0.05439330543933054,0.05857740585774058,0.06276150627615062,0.06694560669456066,0.0711297071129707,0.07531380753138074,0.0794979079497908,0.08368200836820083,0.08786610878661087,0.09205020920502091,0.09623430962343095,0.10041841004184099,0.10460251046025104,0.10878661087866108,0.11297071129707112,0.11715481171548116,0.1213389121338912,0.12552301255230125,0.12970711297071127,0.13389121338912133,0.13807531380753138,0.1422594142259414,0.14644351464435146,0.15062761506276148,0.15481171548117154,0.1589958158995816,0.1631799163179916,0.16736401673640167,0.1715481171548117,0.17573221757322174,0.1799163179916318,0.18410041841004182,0.18828451882845187,0.1924686192468619,0.19665271966527195,0.20083682008368198,0.20502092050209203,0.20920502092050208,0.2133891213389121,0.21757322175732216,0.22175732217573219,0.22594142259414224,0.2301255230125523,0.23430962343096232,0.23849372384937237,0.2426778242677824,0.24686192468619245,0.2510460251046025,0.25523012552301255,0.25941422594142255,0.2635983263598326,0.26778242677824265,0.2719665271966527,0.27615062761506276,0.28033472803347276,0.2845188284518828,0.28870292887029286,0.2928870292887029,0.29707112970711297,0.30125523012552297,0.305439330543933,0.30962343096234307,0.3138075313807531,0.3179916317991632,0.3221757322175732,0.3263598326359832,0.3305439330543933,0.33472803347280333,0.3389121338912134,0.3430962343096234,0.34728033472803344,0.3514644351464435,0.35564853556485354,0.3598326359832636,0.3640167364016736,0.36820083682008364,0.3723849372384937,0.37656903765690375,0.3807531380753138,0.3849372384937238,0.38912133891213385,0.3933054393305439,0.39748953974895396,0.40167364016736395,0.405857740585774,0.41004184100418406,0.4142259414225941,0.41841004184100417,0.42259414225941416,0.4267782426778242,0.43096234309623427,0.4351464435146443,0.4393305439330544,0.44351464435146437,0.4476987447698744,0.4518828451882845,0.45606694560669453,0.4602510460251046,0.4644351464435146,0.46861924686192463,0.4728033472803347,0.47698744769874474,0.4811715481171548,0.4853556485355648,0.48953974895397484,0.4937238493723849,0.49790794979079495,0.502092050209205,0.506276150627615,0.5104602510460251,0.5146443514644351,0.5188284518828451,0.5230125523012552,0.5271966527196652,0.5313807531380753,0.5355648535564853,0.5397489539748953,0.5439330543933054,0.5481171548117154,0.5523012552301255,0.5564853556485355,0.5606694560669455,0.5648535564853556,0.5690376569037656,0.5732217573221757,0.5774058577405857,0.5815899581589957,0.5857740585774058,0.5899581589958158,0.5941422594142259,0.5983263598326359,0.6025104602510459,0.606694560669456,0.610878661087866,0.6150627615062761,0.6192468619246861,0.6234309623430961,0.6276150627615062,0.6317991631799162,0.6359832635983264,0.6401673640167364,0.6443514644351463,0.6485355648535565,0.6527196652719665,0.6569037656903766,0.6610878661087866,0.6652719665271966,0.6694560669456067,0.6736401673640167,0.6778242677824268,0.6820083682008368,0.6861924686192468,0.6903765690376569,0.6945606694560669,0.698744769874477,0.702928870292887,0.707112970711297,0.7112970711297071,0.7154811715481171,0.7196652719665272,0.7238493723849372,0.7280334728033472,0.7322175732217573,0.7364016736401673,0.7405857740585774,0.7447698744769874,0.7489539748953974,0.7531380753138075,0.7573221757322175,0.7615062761506276,0.7656903765690376,0.7698744769874476,0.7740585774058577,0.7782426778242677,0.7824267782426778,0.7866108786610878,0.7907949790794978,0.7949790794979079,0.7991631799163179,0.8033472803347279,0.807531380753138,0.811715481171548,0.8158995815899581,0.8200836820083681,0.8242677824267781,0.8284518828451882,0.8326359832635982,0.8368200836820083,0.8410041841004183,0.8451882845188283,0.8493723849372384,0.8535564853556484,0.8577405857740585,0.8619246861924685,0.8661087866108785,0.8702928870292886,0.8744769874476986,0.8786610878661087,0.8828451882845187,0.8870292887029287,0.8912133891213389,0.8953974895397488,0.899581589958159,0.903765690376569,0.907949790794979,0.9121338912133891,0.9163179916317991,0.9205020920502092,0.9246861924686192,0.9288702928870292,0.9330543933054393,0.9372384937238493,0.9414225941422594,0.9456066945606694,0.9497907949790794,0.9539748953974895,0.9581589958158995,0.9623430962343096,0.9665271966527196,0.9707112970711296,0.9748953974895397,0.9790794979079497,0.9832635983263598,0.9874476987447698,0.9916317991631798,0.9958158995815899,1.0],"y":[0.14060501089565672,0.14088283778515465,0.14117437668125757,0.14148029457499495,0.14180128973406453,0.14213809304132727,0.1424914693767342,0.14286221904252114,0.14325117923128,0.14365922553626193,0.14408727350297595,0.14453628022082632,0.14500724595316689,0.14550121580375022,0.1460192814170989,0.14656258270983058,0.14713230962941984,0.14772970393627682,0.14835606100435697,0.1490127316347919,0.14970112387623702,0.15042270484476727,0.151179002535215,0.15197160761482742,0.15280217518902647,0.15367242652787275,0.15458415074057302,0.15553920638401897,0.1565395229899072,0.15758710249346727,0.15868402054521485,0.15983242768545844,0.1610345503595203,0.16229269174979818,0.16360923239889855,0.16498663059612784,0.1664274224976533,0.16793422194865357,0.16950971997379546,0.17115668390042355,0.17287795607696416,0.17467645214725785,0.17655515883988954,0.17851713123012414,0.1805654894308331,0.18270341466786982,0.18493414469478012,0.18726096850159143,0.18968722027278023,0.1922162725504525,0.1948515285603704,0.19759641366080336,0.20045436587736357,0.20342882549109012,0.20652322365216083,0.20974096999781483,0.21308543926043932,0.21655995686037258,0.2201677834878503,0.22391209868971296,0.22779598348899335,0.23182240207931556,0.23599418265109512,0.24031399742276002,0.2447843419674832,0.24940751394406385,0.25418559135939783,0.25912041050917184,0.264213543762687,0.2694662773766969,0.2748795895414215,0.2804541288790112,0.2861901936301986,0.2920877117781588,0.29814622236917493,0.30436485829703797,0.31074233082165825,0.317276916091671,0.32396644393541485,0.3308082891742017,0.3377993656960141,0.34493612350649583,0.35221454894733234,0.3596301682399747,0.36717805447542784,0.37485283812895587,0.38264872113267095,0.39055949448984884,0.39857855936337727,0.40669895151805197,0.4149133689436421,0.4232142024339775,0.43159356884802497,0.4400433467332665,0.4485552139508604,0.4571206869071671,0.46573116096821093,0.47437795161332363,0.48305233587216456,0.49174559358589653,0.5004490480386277,0.5091541055191895,0.5178522933955252,0.5265352963138058,0.535194990171079,0.5438234735527685,0.5524130963735796,0.5609564855110812,0.5694465672741473,0.5778765866022512,0.586240122945051,0.5945311028235718,0.6027438091235013,0.6108728872166885,0.6189133480480735,0.6268605683613184,0.6347102882669134,0.6424586063811748,0.6501019727832414,0.657637180049939,0.665061352635402,0.6723719348639443,0.679566677801265,0.6866436252611693,0.6936010991931518,0.7004376846810229,0.7071522147649059,0.7137437552790105,0.720211589876207,0.7265552053881889,0.7327742776474424,0.7388686578748471,0.7448383597149452,0.7506835469801073,0.7564045221453197,0.7620017156173483,0.7674756757858036,0.7728270598492599,0.778056625397137,0.7831652227175776,0.7881537877929914,0.7930233359382668,0.7977749560317459,0.8024098052858115,0.8069291045022122,0.8113341337568697,0.8156262284597393,0.8198067757371317,0.8238772110865894,0.8278390152577807,0.8316937113167614,0.8354428618552057,0.8390880663106919,0.842630958368713,0.8460732034216532,0.8494164960644374,0.852662557610846,0.8558131336185033,0.858869991414269,0.8618349176151412,0.8647097156427792,0.8674962032323732,0.870196209938834,0.872811574645113,0.8753441430789634,0.8777957653455672,0.8801682934842785,0.8824635790582229,0.8846834707857396,0.8868298122226409,0.8889044395040612,0.8909091791542693,0.892845845972296,0.8947162410005652,0.8965221495829927,0.8982653395181989,0.8999475593126457,0.901570536537641,0.9031359762932827,0.904645559781565,0.9061009429900344,0.9075037554865942,0.9088555993253137,0.9101580480623906,0.9114126458807956,0.9126209068215325,0.913784314118947,0.9149043196370531,0.9159823434034584,0.9170197732371421,0.918017964466056,0.918978239730313,0.9199018888665516,0.9207901688689508,0.9216443039222985,0.9224654855024788,0.9232548725397511,0.9240135916402323,0.9247427373610504,0.9254433725347414,0.9261165286385616,0.9267632062045259,0.9273843752661248,0.9279809758378323,0.9285539184236826,0.9291040845513728,0.9296323273285203,0.9301394720178946,0.9306263166286217,0.9310936325205441,0.9315421650191003,0.9319726340382659,0.9323857347092799,0.9327821380130337,0.9331624914141858,0.9335274194952079,0.9338775245887276,0.9342133874066783,0.9345355676649034,0.9348446047019983,0.9351410180912925,0.9354253082449973,0.9356979570096523,0.935959428252111,0.9362101684353965,0.9364506071838582,0.9366811578371357,0.9369022179925198,0.9371141700353723,0.9373173816573281,0.9375122063620713,0.9376989839585275,0.9378780410413667,0.9380496914587627,0.9382142367673885,0.9383719666746729,0.9385231594683747,0.9386680824335623,0.9388069922571125,0.9389401354198723],"type":"scatter"},{"hovertemplate":"\u003cb\u003e%{fullData.name}\u003c\u002fb\u003e\u003cbr\u003ex=%{x:.2f}\u003cbr\u003ey=%{y:.3f}\u003cextra\u003e\u003c\u002fextra\u003e","line":{"color":"#4b5563","dash":"dash","width":2},"mode":"lines","name":"Target","showlegend":true,"x":[0.0,0.0041841004184100415,0.008368200836820083,0.012552301255230124,0.016736401673640166,0.02092050209205021,0.025104602510460247,0.02928870292887029,0.03347280334728033,0.03765690376569037,0.04184100418410042,0.046025104602510455,0.050209205020920494,0.05439330543933054,0.05857740585774058,0.06276150627615062,0.06694560669456066,0.0711297071129707,0.07531380753138074,0.0794979079497908,0.08368200836820083,0.08786610878661087,0.09205020920502091,0.09623430962343095,0.10041841004184099,0.10460251046025104,0.10878661087866108,0.11297071129707112,0.11715481171548116,0.1213389121338912,0.12552301255230125,0.12970711297071127,0.13389121338912133,0.13807531380753138,0.1422594142259414,0.14644351464435146,0.15062761506276148,0.15481171548117154,0.1589958158995816,0.1631799163179916,0.16736401673640167,0.1715481171548117,0.17573221757322174,0.1799163179916318,0.18410041841004182,0.18828451882845187,0.1924686192468619,0.19665271966527195,0.20083682008368198,0.20502092050209203,0.20920502092050208,0.2133891213389121,0.21757322175732216,0.22175732217573219,0.22594142259414224,0.2301255230125523,0.23430962343096232,0.23849372384937237,0.2426778242677824,0.24686192468619245,0.2510460251046025,0.25523012552301255,0.25941422594142255,0.2635983263598326,0.26778242677824265,0.2719665271966527,0.27615062761506276,0.28033472803347276,0.2845188284518828,0.28870292887029286,0.2928870292887029,0.29707112970711297,0.30125523012552297,0.305439330543933,0.30962343096234307,0.3138075313807531,0.3179916317991632,0.3221757322175732,0.3263598326359832,0.3305439330543933,0.33472803347280333,0.3389121338912134,0.3430962343096234,0.34728033472803344,0.3514644351464435,0.35564853556485354,0.3598326359832636,0.3640167364016736,0.36820083682008364,0.3723849372384937,0.37656903765690375,0.3807531380753138,0.3849372384937238,0.38912133891213385,0.3933054393305439,0.39748953974895396,0.40167364016736395,0.405857740585774,0.41004184100418406,0.4142259414225941,0.41841004184100417,0.42259414225941416,0.4267782426778242,0.43096234309623427,0.4351464435146443,0.4393305439330544,0.44351464435146437,0.4476987447698744,0.4518828451882845,0.45606694560669453,0.4602510460251046,0.4644351464435146,0.46861924686192463,0.4728033472803347,0.47698744769874474,0.4811715481171548,0.4853556485355648,0.48953974895397484,0.4937238493723849,0.49790794979079495,0.502092050209205,0.506276150627615,0.5104602510460251,0.5146443514644351,0.5188284518828451,0.5230125523012552,0.5271966527196652,0.5313807531380753,0.5355648535564853,0.5397489539748953,0.5439330543933054,0.5481171548117154,0.5523012552301255,0.5564853556485355,0.5606694560669455,0.5648535564853556,0.5690376569037656,0.5732217573221757,0.5774058577405857,0.5815899581589957,0.5857740585774058,0.5899581589958158,0.5941422594142259,0.5983263598326359,0.6025104602510459,0.606694560669456,0.610878661087866,0.6150627615062761,0.6192468619246861,0.6234309623430961,0.6276150627615062,0.6317991631799162,0.6359832635983264,0.6401673640167364,0.6443514644351463,0.6485355648535565,0.6527196652719665,0.6569037656903766,0.6610878661087866,0.6652719665271966,0.6694560669456067,0.6736401673640167,0.6778242677824268,0.6820083682008368,0.6861924686192468,0.6903765690376569,0.6945606694560669,0.698744769874477,0.702928870292887,0.707112970711297,0.7112970711297071,0.7154811715481171,0.7196652719665272,0.7238493723849372,0.7280334728033472,0.7322175732217573,0.7364016736401673,0.7405857740585774,0.7447698744769874,0.7489539748953974,0.7531380753138075,0.7573221757322175,0.7615062761506276,0.7656903765690376,0.7698744769874476,0.7740585774058577,0.7782426778242677,0.7824267782426778,0.7866108786610878,0.7907949790794978,0.7949790794979079,0.7991631799163179,0.8033472803347279,0.807531380753138,0.811715481171548,0.8158995815899581,0.8200836820083681,0.8242677824267781,0.8284518828451882,0.8326359832635982,0.8368200836820083,0.8410041841004183,0.8451882845188283,0.8493723849372384,0.8535564853556484,0.8577405857740585,0.8619246861924685,0.8661087866108785,0.8702928870292886,0.8744769874476986,0.8786610878661087,0.8828451882845187,0.8870292887029287,0.8912133891213389,0.8953974895397488,0.899581589958159,0.903765690376569,0.907949790794979,0.9121338912133891,0.9163179916317991,0.9205020920502092,0.9246861924686192,0.9288702928870292,0.9330543933054393,0.9372384937238493,0.9414225941422594,0.9456066945606694,0.9497907949790794,0.9539748953974895,0.9581589958158995,0.9623430962343096,0.9665271966527196,0.9707112970711296,0.9748953974895397,0.9790794979079497,0.9832635983263598,0.9874476987447698,0.9916317991631798,0.9958158995815899,1.0],"y":[0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97,0.97],"type":"scatter"}],                        {"template":{"data":{"histogram2dcontour":[{"type":"histogram2dcontour","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"choropleth":[{"type":"choropleth","colorbar":{"outlinewidth":0,"ticks":""}}],"histogram2d":[{"type":"histogram2d","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"heatmap":[{"type":"heatmap","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"heatmapgl":[{"type":"heatmapgl","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"contourcarpet":[{"type":"contourcarpet","colorbar":{"outlinewidth":0,"ticks":""}}],"contour":[{"type":"contour","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"surface":[{"type":"surface","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"mesh3d":[{"type":"mesh3d","colorbar":{"outlinewidth":0,"ticks":""}}],"scatter":[{"fillpattern":{"fillmode":"overlay","size":10,"solidity":0.2},"type":"scatter"}],"parcoords":[{"type":"parcoords","line":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scatterpolargl":[{"type":"scatterpolargl","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"bar":[{"error_x":{"color":"#2a3f5f"},"error_y":{"color":"#2a3f5f"},"marker":{"line":{"color":"#E5ECF6","width":0.5},"pattern":{"fillmode":"overlay","size":10,"solidity":0.2}},"type":"bar"}],"scattergeo":[{"type":"scattergeo","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scatterpolar":[{"type":"scatterpolar","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"histogram":[{"marker":{"pattern":{"fillmode":"overlay","size":10,"solidity":0.2}},"type":"histogram"}],"scattergl":[{"type":"scattergl","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scatter3d":[{"type":"scatter3d","line":{"colorbar":{"outlinewidth":0,"ticks":""}},"marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scattermapbox":[{"type":"scattermapbox","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scatterternary":[{"type":"scatterternary","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scattercarpet":[{"type":"scattercarpet","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"carpet":[{"aaxis":{"endlinecolor":"#2a3f5f","gridcolor":"white","linecolor":"white","minorgridcolor":"white","startlinecolor":"#2a3f5f"},"baxis":{"endlinecolor":"#2a3f5f","gridcolor":"white","linecolor":"white","minorgridcolor":"white","startlinecolor":"#2a3f5f"},"type":"carpet"}],"table":[{"cells":{"fill":{"color":"#EBF0F8"},"line":{"color":"white"}},"header":{"fill":{"color":"#C8D4E3"},"line":{"color":"white"}},"type":"table"}],"barpolar":[{"marker":{"line":{"color":"#E5ECF6","width":0.5},"pattern":{"fillmode":"overlay","size":10,"solidity":0.2}},"type":"barpolar"}],"pie":[{"automargin":true,"type":"pie"}]},"layout":{"autotypenumbers":"strict","colorway":["#636efa","#EF553B","#00cc96","#ab63fa","#FFA15A","#19d3f3","#FF6692","#B6E880","#FF97FF","#FECB52"],"font":{"color":"#2a3f5f"},"hovermode":"closest","hoverlabel":{"align":"left"},"paper_bgcolor":"white","plot_bgcolor":"#E5ECF6","polar":{"bgcolor":"#E5ECF6","angularaxis":{"gridcolor":"white","linecolor":"white","ticks":""},"radialaxis":{"gridcolor":"white","linecolor":"white","ticks":""}},"ternary":{"bgcolor":"#E5ECF6","aaxis":{"gridcolor":"white","linecolor":"white","ticks":""},"baxis":{"gridcolor":"white","linecolor":"white","ticks":""},"caxis":{"gridcolor":"white","linecolor":"white","ticks":""}},"coloraxis":{"colorbar":{"outlinewidth":0,"ticks":""}},"colorscale":{"sequential":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]],"sequentialminus":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]],"diverging":[[0,"#8e0152"],[0.1,"#c51b7d"],[0.2,"#de77ae"],[0.3,"#f1b6da"],[0.4,"#fde0ef"],[0.5,"#f7f7f7"],[0.6,"#e6f5d0"],[0.7,"#b8e186"],[0.8,"#7fbc41"],[0.9,"#4d9221"],[1,"#276419"]]},"xaxis":{"gridcolor":"white","linecolor":"white","ticks":"","title":{"standoff":15},"zerolinecolor":"white","automargin":true,"zerolinewidth":2},"yaxis":{"gridcolor":"white","linecolor":"white","ticks":"","title":{"standoff":15},"zerolinecolor":"white","automargin":true,"zerolinewidth":2},"scene":{"xaxis":{"backgroundcolor":"#E5ECF6","gridcolor":"white","linecolor":"white","showbackground":true,"ticks":"","zerolinecolor":"white","gridwidth":2},"yaxis":{"backgroundcolor":"#E5ECF6","gridcolor":"white","linecolor":"white","showbackground":true,"ticks":"","zerolinecolor":"white","gridwidth":2},"zaxis":{"backgroundcolor":"#E5ECF6","gridcolor":"white","linecolor":"white","showbackground":true,"ticks":"","zerolinecolor":"white","gridwidth":2}},"shapedefaults":{"line":{"color":"#2a3f5f"}},"annotationdefaults":{"arrowcolor":"#2a3f5f","arrowhead":0,"arrowwidth":1},"geo":{"bgcolor":"white","landcolor":"#E5ECF6","subunitcolor":"white","showland":true,"showlakes":true,"lakecolor":"white"},"title":{"x":0.05},"mapbox":{"style":"light"}}},"margin":{"l":40,"r":28,"t":20,"b":40},"legend":{"orientation":"v","x":1,"y":0,"xanchor":"right","yanchor":"bottom","bgcolor":"rgba(255,255,255,0)","borderwidth":0},"hoverlabel":{"font":{"color":"#111827","size":12},"bgcolor":"white","bordercolor":"rgba(0,0,0,0.15)","align":"left","namelength":-1},"xaxis":{"tickfont":{"size":12,"color":"rgba(0,0,0,0.55)"},"showgrid":false,"zeroline":false,"showline":true,"linecolor":"rgba(0,0,0,0.25)","linewidth":1,"ticks":"outside","ticklen":6,"tickcolor":"rgba(0,0,0,0.25)","title":{},"automargin":true,"fixedrange":true},"yaxis":{"tickfont":{"size":12,"color":"rgba(0,0,0,0.55)"},"showgrid":false,"zeroline":false,"showline":true,"linecolor":"rgba(0,0,0,0.25)","linewidth":1,"ticks":"outside","ticklen":6,"tickcolor":"rgba(0,0,0,0.25)","title":{},"tickformat":".2f","rangemode":"tozero","automargin":true,"fixedrange":true},"autosize":true,"paper_bgcolor":"rgba(0,0,0,0)","plot_bgcolor":"rgba(0,0,0,0)","hovermode":"x unified"},                        {"displayModeBar": false, "responsive": true, "scrollZoom": false, "doubleClick": false, "modeBarButtonsToRemove": ["zoom2d", "pan2d", "select2d", "lasso2d", "zoomIn2d", "zoomOut2d", "autoScale2d", "resetScale2d", "toggleSpikelines"]}                    ).then(function(){
+                            
+(function(){
+  function attach(gd){
+    function round(){
+      try {
+        var root = gd && gd.parentNode ? gd.parentNode : document;
+        var rects = root.querySelectorAll('.hoverlayer .hovertext rect');
+        rects.forEach(function(r){ r.setAttribute('rx', 8); r.setAttribute('ry', 8); });
+      } catch(e) {}
+    }
+    if (gd && gd.on) {
+      gd.on('plotly_hover', round);
+      gd.on('plotly_unhover', round);
+      gd.on('plotly_relayout', round);
+    }
+    setTimeout(round, 0);
+  }
+  var plots = document.querySelectorAll('.js-plotly-plot');
+  plots.forEach(attach);
+})();
+
+                        })                };                            </script>        </div>
+  <div class="plotly_controls" style="margin-top:12px; display:flex; gap:16px; align-items:center;">
+    <label style="font-size:12px;color:rgba(0,0,0,.65); display:flex; align-items:center; gap:6px; white-space:nowrap; padding:6px 10px;">
+      Dataset
+      <select id="__DSID__" style="font-size:12px; padding:2px 6px;">
+        <option value="0">CIFAR-10</option>
+        <option value="1">CIFAR-100</option>
+        <option value="2">ImageNet-1K</option>
+      </select>
+    </label>
+    <label style="font-size:12px;color:rgba(0,0,0,.65);display:flex;align-items:center;gap:10px; flex:1; padding:6px 10px;">
+      Augmentation α
+      <input id="line-ex-alpha-647b18ba" type="range" min="0" max="1" step="0.01" value="0.70" style="flex:1;">
+      <span class="alpha-value">0.70</span>
+    </label>
+  </div>
+</div>
+<script>
+(function(){
+  var container = document.getElementById('line-ex-container-647b18ba');
+  if(!container) return;
+  var gd = container.querySelector('.js-plotly-plot');
+  var slider = document.getElementById('line-ex-alpha-647b18ba');
+  var dsSelect = document.getElementById('__DSID__');
+  var valueEl = container.querySelector('.alpha-value');
+  var N = 240;
+  var xs = Array.from({length: N}, function(_,i){ return i/(N-1); });
+  function logistic(x, ymin, ymax, k, x0){ return ymin + (ymax - ymin) / (1 + Math.exp(-k*(x - x0))); }
+  function blend(l,e,a){ return (1-a)*l + a*e; }
+  var datasets = [
+    { name:'CIFAR-10',  base:{ymin:0.10,ymax:0.90,k:10.0,x0:0.55}, aug:{ymin:0.15,ymax:0.96,k:12.0,x0:0.40}, target:0.97 },
+    { name:'CIFAR-100', base:{ymin:0.05,ymax:0.70,k:9.5,x0:0.60},  aug:{ymin:0.08,ymax:0.80,k:11.0,x0:0.45},  target:0.85 },
+    { name:'ImageNet-1K', base:{ymin:0.02,ymax:0.68,k:8.5,x0:0.65}, aug:{ymin:0.04,ymax:0.75,k:9.5,x0:0.50},  target:0.82 }
+  ];
+  var dsi = 0;
+  var yb = xs.map(function(x){ return logistic(x, datasets[dsi].base.ymin, datasets[dsi].base.ymax, datasets[dsi].base.k, datasets[dsi].base.x0); });
+  var ya = xs.map(function(x){ return logistic(x, datasets[dsi].aug.ymin, datasets[dsi].aug.ymax, datasets[dsi].aug.k, datasets[dsi].aug.x0); });
+  var yt = xs.map(function(){ return datasets[dsi].target; });
+  function applyAlpha(a){
+    var yi = yb.map(function(v,i){ return blend(v, ya[i], a); });
+    Plotly.restyle(gd, {y:[yi]}, [1]); // only Improved changes with α
+    if(valueEl) valueEl.textContent = a.toFixed(2);
+  }
+  function applyDataset(){
+    var d = datasets[dsi];
+    yb = xs.map(function(x){ return logistic(x, d.base.ymin, d.base.ymax, d.base.k, d.base.x0); });
+    ya = xs.map(function(x){ return logistic(x, d.aug.ymin, d.aug.ymax, d.aug.k, d.aug.x0); });
+    yt = xs.map(function(){ return d.target; });
+    var a = parseFloat(slider.value)||0;
+    var yi = yb.map(function(v,i){ return blend(v, ya[i], a); });
+    Plotly.restyle(gd, {y:[yb]}, [0]); // Baseline
+    Plotly.restyle(gd, {y:[yi]}, [1]); // Improved (blended)
+    Plotly.restyle(gd, {y:[yt]}, [2]); // Target
+  }
+  var initA = parseFloat(slider.value)||0;
+  slider.addEventListener('input', function(e){ applyAlpha(parseFloat(e.target.value)||0); });
+  dsSelect.addEventListener('change', function(e){ dsi = parseInt(e.target.value)||0; applyDataset(); });
+  setTimeout(function(){ applyDataset(); applyAlpha(initA); }, 0);
+})();
+</script>
diff --git a/app/src/content/embeds/throughput-debug-1node.html b/app/src/content/embeds/throughput-debug-1node.html
new file mode 100644
index 0000000000000000000000000000000000000000..c4c4bc8be805b4a17adaed28a894e153186e9f5d
--- /dev/null
+++ b/app/src/content/embeds/throughput-debug-1node.html
@@ -0,0 +1,352 @@
+<div class="throughput-debug-1node"></div>
+<style>
+  .throughput-debug-1node { position: relative; }
+  .throughput-debug-1node .axis-label { fill: var(--text-color); font-size: 12px; font-weight: 700; }
+  .throughput-debug-1node .axes path, .throughput-debug-1node .axes line { stroke: var(--axis-color); }
+  .throughput-debug-1node .axes text { fill: var(--tick-color); }
+  .throughput-debug-1node .grid line { stroke: var(--grid-color); }
+  .throughput-debug-1node .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+  .throughput-debug-1node .chart-header { display:flex; align-items:flex-start; justify-content:flex-start; gap:12px; margin: 8px 0 0 0; flex-wrap: wrap; }
+  .throughput-debug-1node .legend-bottom { display:flex; align-items:center; justify-content:flex-start; font-size:12px; color: var(--text-color); }
+  .throughput-debug-1node .legend-bottom .items { display:flex; flex-wrap:wrap; gap:8px 14px; }
+  .throughput-debug-1node .legend-bottom .item { display:inline-flex; align-items:center; gap:6px; white-space:nowrap; }
+  .throughput-debug-1node .legend-bottom .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; }
+  .throughput-debug-1node .legend-bottom .legend-title { font-size: 12px; font-weight: 700; color: var(--text-color); }
+  .throughput-debug-1node .legend-bottom { flex-direction: column; align-items: flex-start; gap: 6px; }
+  .throughput-debug-1node .lines path.active { stroke-width: 3; }
+  .throughput-debug-1node .d3-tooltip { z-index: var(--z-elevated); backdrop-filter: saturate(1.12) blur(8px); }
+  .throughput-debug-1node .d3-tooltip__inner { display:flex; flex-direction:column; gap:6px; min-width: 220px; }
+  .throughput-debug-1node .d3-tooltip__inner > div:first-child { font-weight: 800; letter-spacing: 0.1px; margin-bottom: 0; }
+  .throughput-debug-1node .d3-tooltip__inner > div:nth-child(2) { font-size: 11px; color: var(--muted-color); display: block; margin-top: -4px; margin-bottom: 2px; letter-spacing: 0.1px; }
+  .throughput-debug-1node .d3-tooltip__color-dot { display:inline-block; width: 12px; height: 12px; border-radius: 3px; border: 1px solid var(--border-color); }
+  /* Ghosting on hover */
+  .throughput-debug-1node.hovering .legend-bottom .item.ghost { opacity: .35; }
+  .throughput-debug-1node.hovering .lines path.ghost { opacity: .25; }
+  .throughput-debug-1node.hovering .points circle.ghost { opacity: .25; }
+</style>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true }); if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('throughput-debug-1node'))){
+        const cs = Array.from(document.querySelectorAll('.throughput-debug-1node')).filter(el => !(el.dataset && el.dataset.mounted === 'true'));
+        container = cs[cs.length - 1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted === 'true') return; container.dataset.mounted = 'true'; }
+
+      // Tooltip
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none',
+          padding:'8px 10px', borderRadius:'8px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)',
+          background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 4px 24px rgba(0,0,0,.18)', opacity:'0', transition:'opacity .12s ease'
+        });
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // Header (legend) placed after the chart
+      const header = document.createElement('div'); header.className = 'chart-header';
+      const legendBottom = document.createElement('div'); legendBottom.className = 'legend-bottom'; header.appendChild(legendBottom);
+
+      // Chart card (SVG)
+      const card = document.createElement('div'); card.className = 'chart-card'; container.appendChild(card);
+      container.appendChild(header);
+      
+      // SVG
+      const svg = d3.select(card).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+      const gGrid = gRoot.append('g').attr('class','grid');
+      const gAxes = gRoot.append('g').attr('class','axes');
+      const gLines = gRoot.append('g').attr('class','lines');
+      const gPoints = gRoot.append('g').attr('class','points');
+      const overlay = gRoot.append('rect').attr('fill','transparent').style('cursor','crosshair');
+      const hoverLine = gRoot.append('line').attr('stroke-width',1).style('display','none');
+
+      // State/data
+      let width = 800, height = 480; const margin = { top: 16, right: 32, bottom: 44, left: 80 };
+      const xScale = d3.scaleLinear();
+      const yScale = d3.scaleLinear();
+      const lineGen = d3.line().x(d => xScale(d.step)).y(d => yScale(d.value));
+      let data = [];
+
+      // Colors - following guidelines to use ColorPalettes
+      let currentColors = ['var(--primary-color, #4e79a7)', 'var(--primary-color, #4e79a7)'];
+      
+      function refreshPalette(){
+        try { 
+          if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+            const colors = window.ColorPalettes.getColors('categorical', 2);
+            if (colors && colors.length >= 2) {
+              currentColors = colors;
+              // Re-render with new colors
+              if (data.length > 0) render();
+              return;
+            }
+          }
+        } catch(_){}
+        // Fallback to CSS variable or default
+        currentColors = ['var(--primary-color, #4e79a7)', '#e15759'];
+        // Re-render with fallback colors
+        if (data.length > 0) render();
+      }
+      
+      function getColors(){
+        return currentColors;
+      }
+      
+      // Format helper for thousands (5000 -> 5k, 1500 -> 1.5k)
+      function formatK(v){
+        const abs = Math.abs(v);
+        if (abs >= 1000) {
+          const n = v / 1000;
+          const s = d3.format('.1f')(n);
+          return (s.endsWith('.0') ? s.slice(0, -2) : s) + 'k';
+        }
+        return d3.format('d')(v);
+      }
+
+      // Format helper for throughput values
+      function formatThroughput(v){
+        if (v >= 1000) {
+          return d3.format('.1f')(v / 1000) + 'k';
+        }
+        return d3.format('.1f')(v);
+      }
+
+      function updateLayout(){
+        const axisColor = getComputedStyle(container).getPropertyValue('--axis-color').trim() || 'rgba(0,0,0,0.25)';
+        width = container.clientWidth || 800;
+        height = Math.max(280, Math.round(width / 3));
+        svg.attr('width', width).attr('height', height);
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        const innerWidth = width - margin.left - margin.right;
+        const innerHeight = height - margin.top - margin.bottom;
+        overlay.attr('x',0).attr('y',0).attr('width', innerWidth).attr('height', innerHeight);
+        hoverLine.attr('y1',0).attr('y2', innerHeight).attr('stroke', axisColor);
+        return { innerWidth, innerHeight };
+      }
+
+      function render(){
+        if (data.length === 0) return;
+        
+        const { innerWidth, innerHeight } = updateLayout();
+        
+        // Sort data by step
+        const sortedData = data.slice().sort((a, b) => a.step - b.step);
+        
+        // Prepare series data - filter out empty values
+        const series = [
+          {
+            name: 'Throughput for 32k steps',
+            values: sortedData
+              .filter(d => d.run1 !== null && d.run1 !== undefined && d.run1 !== '')
+              .map(d => ({ step: d.step, value: d.run1 }))
+          },
+          {
+            name: 'Throughput for 3.2M steps',
+            values: sortedData
+              .filter(d => d.run2 !== null && d.run2 !== undefined && d.run2 !== '')
+              .map(d => ({ step: d.step, value: d.run2 }))
+          }
+        ];
+        
+        // domains
+        const allValues = [...series[0].values, ...series[1].values];
+        if (allValues.length === 0) return;
+        
+        const minStep = d3.min(allValues, d => d.step);
+        const maxStep = d3.max(allValues, d => d.step);
+        const minValue = d3.min(allValues, d => d.value);
+        const maxValue = d3.max(allValues, d => d.value);
+        
+        xScale.domain([minStep, maxStep]).range([0, innerWidth]);
+        yScale.domain([minValue, maxValue]).nice().range([innerHeight, 0]);
+
+        // grid
+        gGrid.selectAll('*').remove();
+        gGrid.selectAll('line').data(yScale.ticks(6)).join('line')
+          .attr('x1',0).attr('x2', innerWidth).attr('y1', d=>yScale(d)).attr('y2', d=>yScale(d))
+          .attr('stroke','var(--grid-color)').attr('stroke-width',1).attr('shape-rendering','crispEdges');
+
+        // axes
+        gAxes.selectAll('*').remove();
+        gAxes.append('g').attr('transform', `translate(0,${innerHeight})`).call(d3.axisBottom(xScale).ticks(8).tickFormat(formatK)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('g').call(d3.axisLeft(yScale).ticks(6).tickFormat(formatThroughput)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('x', innerWidth/2).attr('y', innerHeight + 38).text('Training Step');
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('transform', `translate(${-60}, ${innerHeight/2}) rotate(-90)`).text('Tokens/sec/GPU');
+
+        // lines
+        const colors = getColors();
+        gLines.selectAll('*').remove();
+        series.forEach((s, i) => {
+          if (s.values.length > 0) {
+            gLines.append('path')
+              .attr('class', `line line-${i}`)
+              .attr('data-series', s.name)
+              .attr('fill','none')
+              .attr('stroke', colors[i % colors.length])
+              .attr('stroke-width', 2)
+              .attr('d', lineGen(s.values));
+          }
+        });
+
+        // point markers
+        gPoints.selectAll('*').remove();
+        series.forEach((s, i) => {
+          if (s.values.length > 0) {
+            gPoints.selectAll(`circle.point-${i}`).data(s.values).join('circle')
+              .attr('class', `point point-${i}`)
+              .attr('data-series', s.name)
+              .attr('r', 2)
+              .attr('fill', colors[i % colors.length])
+              .attr('fill-opacity', 0.6)
+              .attr('cx', d=>xScale(d.step))
+              .attr('cy', d=>yScale(d.value));
+          }
+        });
+
+        // legend
+        const validSeries = series.filter(s => s.values.length > 0);
+        legendBottom.innerHTML = `<div class="legend-title">Legend</div><div class="items">${validSeries.map((s, i) => `<span class="item" data-series="${s.name}"><span class="swatch" style="background:${colors[i % colors.length]}"></span><span>${s.name}</span></span>`).join('')}</div>`;
+
+        // Legend hover → ghost lines/points
+        try {
+          const legendNode = legendBottom;
+          legendNode.querySelectorAll('.item').forEach(el => {
+            el.addEventListener('mouseenter', () => {
+              const seriesName = el.getAttribute('data-series'); if (!seriesName) return;
+              container.classList.add('hovering');
+              gLines.selectAll('path.line').classed('ghost', s => s.getAttribute && s.getAttribute('data-series') !== seriesName);
+              gPoints.selectAll('circle.point').classed('ghost', p => p.getAttribute && p.getAttribute('data-series') !== seriesName);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.toggle('ghost', it.getAttribute('data-series') !== seriesName));
+            });
+            el.addEventListener('mouseleave', () => {
+              container.classList.remove('hovering');
+              gLines.selectAll('path.line').classed('ghost', false);
+              gPoints.selectAll('circle.point').classed('ghost', false);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.remove('ghost'));
+            });
+          });
+        } catch {}
+
+        // hover
+        function onMove(ev){
+          const [mx, my] = d3.pointer(ev, overlay.node());
+          const sx = xScale.invert(mx);
+          
+          // Find nearest step
+          const steps = Array.from(new Set(allValues.map(d => d.step))).sort((a,b) => a - b);
+          const nearest = steps.reduce((best, s) => Math.abs(s - sx) < Math.abs(best - sx) ? s : best, steps[0]);
+          const xpx = xScale(nearest);
+          hoverLine.style('display', null).attr('x1', xpx).attr('x2', xpx);
+          
+          // Find data point for this step
+          const dataPoint = sortedData.find(d => d.step === nearest);
+          if (!dataPoint) return;
+          
+          // tooltip content
+          let html = `<div style="font-weight:800;letter-spacing:.1px;">Throughput Debug (1 Node)</div><div style="font-size:11px;color:var(--muted-color);margin-top:-4px;margin-bottom:2px;">Step ${formatK(nearest)}</div>`;
+          
+          validSeries.forEach((s, i) => {
+            const value = s.name === 'Throughput for 32k steps' ? dataPoint.run1 : dataPoint.run2;
+            if (value !== null && value !== undefined && value !== '') {
+              html += `<div style="display:flex;align-items:center;gap:6px;white-space:nowrap;"><span class="d3-tooltip__color-dot" style="background:${colors[i % colors.length]}"></span><strong>${s.name}</strong><span style="margin-left:auto;">${formatThroughput(value)}</span></div>`;
+            }
+          });
+          
+          tipInner.innerHTML = html; 
+          tip.style.opacity = '1'; 
+          tip.style.transform = `translate(${Math.round(mx + margin.left + 12)}px, ${Math.round(my + margin.top + 12)}px)`;
+        }
+        
+        function onLeave(){ 
+          tip.style.opacity='0'; 
+          tip.style.transform='translate(-9999px, -9999px)'; 
+          hoverLine.style('display','none'); 
+        }
+        
+        overlay.on('mousemove', onMove).on('mouseleave', onLeave);
+      }
+
+      // load CSV and init
+      (async () => {
+        try {
+          // Try multiple possible paths for the CSV file
+          const csvPaths = [
+            '/data/throughput_debug_1node.csv',
+            './assets/data/throughput_debug_1node.csv',
+            '../assets/data/throughput_debug_1node.csv',
+            '../../assets/data/throughput_debug_1node.csv'
+          ];
+          
+          let csvText = null;
+          for (const path of csvPaths) {
+            try {
+              const response = await fetch(path, { cache: 'no-cache' });
+              if (response.ok) {
+                csvText = await response.text();
+                break;
+              }
+            } catch(_) {}
+          }
+          
+          if (!csvText) {
+            throw new Error('CSV file not found: throughput_debug_1node.csv');
+          }
+          
+          const rows = d3.csvParse(csvText);
+          
+          // Parse the data - use the two main columns (without Min/Max)
+          const col1 = "06/04/2025_19:54:26_3B-nanotron-old-nn1-fwedu-32k - tokens_per_sec_per_gpu";
+          const col2 = "06/04/2025_19:50:35_3B-nanotron-old-nn1-fwedu- - tokens_per_sec_per_gpu";
+          
+          data = rows.map(d => ({
+            step: +d.Step,
+            run1: d[col1] === '' ? null : +d[col1],
+            run2: d[col2] === '' ? null : +d[col2]
+          })).filter(d => !isNaN(d.step));
+          
+          // Initialize palette and listen for changes
+          refreshPalette();
+          document.addEventListener('palettes:updated', refreshPalette);
+          
+          render();
+          
+          const rerender = () => render();
+          if (window.ResizeObserver) { 
+            const ro = new ResizeObserver(() => rerender()); 
+            ro.observe(container); 
+          } else { 
+            window.addEventListener('resize', rerender); 
+          }
+        } catch (e) {
+          const pre = document.createElement('pre'); 
+          pre.textContent = 'CSV load error: ' + (e && e.message ? e.message : e);
+          pre.style.color = 'var(--danger, #b00020)'; 
+          pre.style.fontSize = '12px'; 
+          pre.style.whiteSpace = 'pre-wrap'; 
+          container.appendChild(pre);
+        }
+      })();
+    };
+
+    if (document.readyState === 'loading') { 
+      document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); 
+    } else { 
+      ensureD3(bootstrap); 
+    }
+  })();
+</script>
diff --git a/app/src/content/embeds/throughput-drops-comparison.html b/app/src/content/embeds/throughput-drops-comparison.html
new file mode 100644
index 0000000000000000000000000000000000000000..96a4dd5037599471e622812f1bc3ce51d5f03f1d
--- /dev/null
+++ b/app/src/content/embeds/throughput-drops-comparison.html
@@ -0,0 +1,335 @@
+<div class="throughput-drops-comparison"></div>
+<style>
+  .throughput-drops-comparison { position: relative; }
+  .throughput-drops-comparison .axis-label { fill: var(--text-color); font-size: 12px; font-weight: 700; }
+  .throughput-drops-comparison .axes path, .throughput-drops-comparison .axes line { stroke: var(--axis-color); }
+  .throughput-drops-comparison .axes text { fill: var(--tick-color); }
+  .throughput-drops-comparison .grid line { stroke: var(--grid-color); }
+  .throughput-drops-comparison .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+  .throughput-drops-comparison .chart-header { display:flex; align-items:flex-start; justify-content:flex-start; gap:12px; margin: 8px 0 0 0; flex-wrap: wrap; }
+  .throughput-drops-comparison .legend-bottom { display:flex; align-items:center; justify-content:flex-start; font-size:12px; color: var(--text-color); }
+  .throughput-drops-comparison .legend-bottom .items { display:flex; flex-wrap:wrap; gap:8px 14px; }
+  .throughput-drops-comparison .legend-bottom .item { display:inline-flex; align-items:center; gap:6px; white-space:nowrap; }
+  .throughput-drops-comparison .legend-bottom .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; }
+  .throughput-drops-comparison .legend-bottom .legend-title { font-size: 12px; font-weight: 700; color: var(--text-color); }
+  .throughput-drops-comparison .legend-bottom { flex-direction: column; align-items: flex-start; gap: 6px; }
+  .throughput-drops-comparison .lines path.active { stroke-width: 3; }
+  .throughput-drops-comparison .d3-tooltip { z-index: var(--z-elevated); backdrop-filter: saturate(1.12) blur(8px); }
+  .throughput-drops-comparison .d3-tooltip__inner { display:flex; flex-direction:column; gap:6px; min-width: 220px; }
+  .throughput-drops-comparison .d3-tooltip__inner > div:first-child { font-weight: 800; letter-spacing: 0.1px; margin-bottom: 0; }
+  .throughput-drops-comparison .d3-tooltip__inner > div:nth-child(2) { font-size: 11px; color: var(--muted-color); display: block; margin-top: -4px; margin-bottom: 2px; letter-spacing: 0.1px; }
+  .throughput-drops-comparison .d3-tooltip__color-dot { display:inline-block; width: 12px; height: 12px; border-radius: 3px; border: 1px solid var(--border-color); }
+  /* Ghosting on hover */
+  .throughput-drops-comparison.hovering .legend-bottom .item.ghost { opacity: .35; }
+  .throughput-drops-comparison.hovering .lines path.ghost { opacity: .25; }
+  .throughput-drops-comparison.hovering .points circle.ghost { opacity: .25; }
+</style>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true }); if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('throughput-drops-comparison'))){
+        const cs = Array.from(document.querySelectorAll('.throughput-drops-comparison')).filter(el => !(el.dataset && el.dataset.mounted === 'true'));
+        container = cs[cs.length - 1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted === 'true') return; container.dataset.mounted = 'true'; }
+
+      // Tooltip
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none',
+          padding:'8px 10px', borderRadius:'8px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)',
+          background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 4px 24px rgba(0,0,0,.18)', opacity:'0', transition:'opacity .12s ease'
+        });
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // Header (legend) placed after the chart
+      const header = document.createElement('div'); header.className = 'chart-header';
+      const legendBottom = document.createElement('div'); legendBottom.className = 'legend-bottom'; header.appendChild(legendBottom);
+
+      // Chart card (SVG)
+      const card = document.createElement('div'); card.className = 'chart-card'; container.appendChild(card);
+      container.appendChild(header);
+      
+      // SVG
+      const svg = d3.select(card).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+      const gGrid = gRoot.append('g').attr('class','grid');
+      const gAxes = gRoot.append('g').attr('class','axes');
+      const gLines = gRoot.append('g').attr('class','lines');
+      const gPoints = gRoot.append('g').attr('class','points');
+      const overlay = gRoot.append('rect').attr('fill','transparent').style('cursor','crosshair');
+      const hoverLine = gRoot.append('line').attr('stroke-width',1).style('display','none');
+
+      // State/data
+      let width = 800, height = 480; const margin = { top: 16, right: 32, bottom: 44, left: 80 };
+      const xScale = d3.scaleLinear();
+      const yScale = d3.scaleLinear();
+      const lineGen = d3.line().x(d => xScale(d.step)).y(d => yScale(d.value));
+      let data = [];
+
+      // Colors - following guidelines to use ColorPalettes
+      let currentColors = ['var(--primary-color, #4e79a7)', 'var(--primary-color, #4e79a7)'];
+      
+      function refreshPalette(){
+        try { 
+          if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+            const colors = window.ColorPalettes.getColors('categorical', 2);
+            if (colors && colors.length >= 2) {
+              currentColors = colors;
+              // Re-render with new colors
+              if (data.length > 0) render();
+              return;
+            }
+          }
+        } catch(_){}
+        // Fallback to CSS variable or default
+        currentColors = ['var(--primary-color, #4e79a7)', '#e15759'];
+        // Re-render with fallback colors
+        if (data.length > 0) render();
+      }
+      
+      function getColors(){
+        return currentColors;
+      }
+      
+      // Format helper for thousands (5000 -> 5k, 1500 -> 1.5k)
+      function formatK(v){
+        const abs = Math.abs(v);
+        if (abs >= 1000) {
+          const n = v / 1000;
+          const s = d3.format('.1f')(n);
+          return (s.endsWith('.0') ? s.slice(0, -2) : s) + 'k';
+        }
+        return d3.format('d')(v);
+      }
+
+      // Format helper for throughput values
+      function formatThroughput(v){
+        if (v >= 1000) {
+          return d3.format('.1f')(v / 1000) + 'k';
+        }
+        return d3.format('.1f')(v);
+      }
+
+      function updateLayout(){
+        const axisColor = getComputedStyle(container).getPropertyValue('--axis-color').trim() || 'rgba(0,0,0,0.25)';
+        width = container.clientWidth || 800;
+        height = Math.max(280, Math.round(width / 3));
+        svg.attr('width', width).attr('height', height);
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        const innerWidth = width - margin.left - margin.right;
+        const innerHeight = height - margin.top - margin.bottom;
+        overlay.attr('x',0).attr('y',0).attr('width', innerWidth).attr('height', innerHeight);
+        hoverLine.attr('y1',0).attr('y2', innerHeight).attr('stroke', axisColor);
+        return { innerWidth, innerHeight };
+      }
+
+      function render(){
+        if (data.length === 0) return;
+        
+        const { innerWidth, innerHeight } = updateLayout();
+        
+        // Sort data by step
+        const sortedData = data.slice().sort((a, b) => a.step - b.step);
+        
+        // Prepare series data
+        const series = [
+          {
+            name: 'Throughput (main run)',
+            values: sortedData.map(d => ({ step: d.step, value: d.throughput_drops }))
+          },
+          {
+            name: 'Throughput (ablations)',
+            values: sortedData.map(d => ({ step: d.step, value: d.throughput_no_drops }))
+          }
+        ];
+        
+        // domains
+        const minStep = d3.min(sortedData, d => d.step);
+        const maxStep = d3.max(sortedData, d => d.step);
+        const minValue = d3.min(sortedData, d => Math.min(d.throughput_drops, d.throughput_no_drops));
+        const maxValue = d3.max(sortedData, d => Math.max(d.throughput_drops, d.throughput_no_drops));
+        
+        xScale.domain([minStep, maxStep]).range([0, innerWidth]);
+        yScale.domain([minValue, maxValue]).nice().range([innerHeight, 0]);
+
+        // grid
+        gGrid.selectAll('*').remove();
+        gGrid.selectAll('line').data(yScale.ticks(6)).join('line')
+          .attr('x1',0).attr('x2', innerWidth).attr('y1', d=>yScale(d)).attr('y2', d=>yScale(d))
+          .attr('stroke','var(--grid-color)').attr('stroke-width',1).attr('shape-rendering','crispEdges');
+
+        // axes
+        gAxes.selectAll('*').remove();
+        gAxes.append('g').attr('transform', `translate(0,${innerHeight})`).call(d3.axisBottom(xScale).ticks(8).tickFormat(formatK)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('g').call(d3.axisLeft(yScale).ticks(6).tickFormat(formatThroughput)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('x', innerWidth/2).attr('y', innerHeight + 38).text('Training Step');
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('transform', `translate(${-60}, ${innerHeight/2}) rotate(-90)`).text('Tokens/sec/GPU');
+
+        // lines
+        const colors = getColors();
+        gLines.selectAll('*').remove();
+        series.forEach((s, i) => {
+          gLines.append('path')
+            .attr('class', `line line-${i}`)
+            .attr('data-series', s.name)
+            .attr('fill','none')
+            .attr('stroke', colors[i % colors.length])
+            .attr('stroke-width', 2)
+            .attr('d', lineGen(s.values));
+        });
+
+        // point markers
+        gPoints.selectAll('*').remove();
+        series.forEach((s, i) => {
+          gPoints.selectAll(`circle.point-${i}`).data(s.values).join('circle')
+            .attr('class', `point point-${i}`)
+            .attr('data-series', s.name)
+            .attr('r', 2)
+            .attr('fill', colors[i % colors.length])
+            .attr('fill-opacity', 0.6)
+            .attr('cx', d=>xScale(d.step))
+            .attr('cy', d=>yScale(d.value));
+        });
+
+        // legend
+        legendBottom.innerHTML = `<div class="legend-title">Legend</div><div class="items">${series.map((s, i) => `<span class="item" data-series="${s.name}"><span class="swatch" style="background:${colors[i % colors.length]}"></span><span>${s.name}</span></span>`).join('')}</div>`;
+
+        // Legend hover → ghost lines/points
+        try {
+          const legendNode = legendBottom;
+          legendNode.querySelectorAll('.item').forEach(el => {
+            el.addEventListener('mouseenter', () => {
+              const seriesName = el.getAttribute('data-series'); if (!seriesName) return;
+              container.classList.add('hovering');
+              gLines.selectAll('path.line').classed('ghost', s => s.getAttribute && s.getAttribute('data-series') !== seriesName);
+              gPoints.selectAll('circle.point').classed('ghost', p => p.getAttribute && p.getAttribute('data-series') !== seriesName);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.toggle('ghost', it.getAttribute('data-series') !== seriesName));
+            });
+            el.addEventListener('mouseleave', () => {
+              container.classList.remove('hovering');
+              gLines.selectAll('path.line').classed('ghost', false);
+              gPoints.selectAll('circle.point').classed('ghost', false);
+              legendNode.querySelectorAll('.item').forEach(it => it.classList.remove('ghost'));
+            });
+          });
+        } catch {}
+
+        // hover
+        function onMove(ev){
+          const [mx, my] = d3.pointer(ev, overlay.node());
+          const sx = xScale.invert(mx);
+          
+          // Find nearest step
+          const steps = Array.from(new Set(sortedData.map(d => d.step))).sort((a,b) => a - b);
+          const nearest = steps.reduce((best, s) => Math.abs(s - sx) < Math.abs(best - sx) ? s : best, steps[0]);
+          const xpx = xScale(nearest);
+          hoverLine.style('display', null).attr('x1', xpx).attr('x2', xpx);
+          
+          // Find data point for this step
+          const dataPoint = sortedData.find(d => d.step === nearest);
+          if (!dataPoint) return;
+          
+          // tooltip content
+          let html = `<div style="font-weight:800;letter-spacing:.1px;">Throughput Comparison</div><div style="font-size:11px;color:var(--muted-color);margin-top:-4px;margin-bottom:2px;">Step ${formatK(nearest)}</div>`;
+          
+          series.forEach((s, i) => {
+            const value = s.name === 'Throughput (main run)' ? dataPoint.throughput_drops : dataPoint.throughput_no_drops;
+            html += `<div style="display:flex;align-items:center;gap:6px;white-space:nowrap;"><span class="d3-tooltip__color-dot" style="background:${colors[i % colors.length]}"></span><strong>${s.name}</strong><span style="margin-left:auto;">${formatThroughput(value)}</span></div>`;
+          });
+          
+          tipInner.innerHTML = html; 
+          tip.style.opacity = '1'; 
+          tip.style.transform = `translate(${Math.round(mx + margin.left + 12)}px, ${Math.round(my + margin.top + 12)}px)`;
+        }
+        
+        function onLeave(){ 
+          tip.style.opacity='0'; 
+          tip.style.transform='translate(-9999px, -9999px)'; 
+          hoverLine.style('display','none'); 
+        }
+        
+        overlay.on('mousemove', onMove).on('mouseleave', onLeave);
+      }
+
+      // load CSV and init
+      (async () => {
+        try {
+          // Try multiple possible paths for the CSV file
+          const csvPaths = [
+            '/data/throughput_drops_comparison_before_after.csv',
+            './assets/data/throughput_drops_comparison_before_after.csv',
+            '../assets/data/throughput_drops_comparison_before_after.csv',
+            '../../assets/data/throughput_drops_comparison_before_after.csv'
+          ];
+          
+          let csvText = null;
+          for (const path of csvPaths) {
+            try {
+              const response = await fetch(path, { cache: 'no-cache' });
+              if (response.ok) {
+                csvText = await response.text();
+                break;
+              }
+            } catch(_) {}
+          }
+          
+          if (!csvText) {
+            throw new Error('CSV file not found: throughput_drops_comparison_before_after.csv');
+          }
+          
+          const rows = d3.csvParse(csvText);
+          
+          // Parse the data
+          data = rows.map(d => ({
+            step: +d.Step,
+            throughput_drops: +d.throughput_drops,
+            throughput_no_drops: +d.throughput_no_drops
+          })).filter(d => !isNaN(d.step) && !isNaN(d.throughput_drops) && !isNaN(d.throughput_no_drops));
+          
+          // Initialize palette and listen for changes
+          refreshPalette();
+          document.addEventListener('palettes:updated', refreshPalette);
+          
+          render();
+          
+          const rerender = () => render();
+          if (window.ResizeObserver) { 
+            const ro = new ResizeObserver(() => rerender()); 
+            ro.observe(container); 
+          } else { 
+            window.addEventListener('resize', rerender); 
+          }
+        } catch (e) {
+          const pre = document.createElement('pre'); 
+          pre.textContent = 'CSV load error: ' + (e && e.message ? e.message : e);
+          pre.style.color = 'var(--danger, #b00020)'; 
+          pre.style.fontSize = '12px'; 
+          pre.style.whiteSpace = 'pre-wrap'; 
+          container.appendChild(pre);
+        }
+      })();
+    };
+
+    if (document.readyState === 'loading') { 
+      document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); 
+    } else { 
+      ensureD3(bootstrap); 
+    }
+  })();
+</script>
diff --git a/app/src/content/embeds/throughput-weka-drops.html b/app/src/content/embeds/throughput-weka-drops.html
new file mode 100644
index 0000000000000000000000000000000000000000..b66603fd84951ba6d45ffb84cb5c06c1f2fce947
--- /dev/null
+++ b/app/src/content/embeds/throughput-weka-drops.html
@@ -0,0 +1,283 @@
+<div class="throughput-weka-drops"></div>
+<style>
+  .throughput-weka-drops { position: relative; }
+  .throughput-weka-drops .axis-label { fill: var(--text-color); font-size: 12px; font-weight: 700; }
+  .throughput-weka-drops .axes path, .throughput-weka-drops .axes line { stroke: var(--axis-color); }
+  .throughput-weka-drops .axes text { fill: var(--tick-color); }
+  .throughput-weka-drops .grid line { stroke: var(--grid-color); }
+  .throughput-weka-drops .chart-card { background: var(--surface-bg); border: 1px solid var(--border-color); border-radius: 10px; padding: 8px; }
+  .throughput-weka-drops .chart-header { display:flex; align-items:flex-start; justify-content:flex-start; gap:12px; margin: 8px 0 0 0; flex-wrap: wrap; }
+  .throughput-weka-drops .legend-bottom { display:flex; align-items:center; justify-content:flex-start; font-size:12px; color: var(--text-color); }
+  .throughput-weka-drops .legend-bottom .items { display:flex; flex-wrap:wrap; gap:8px 14px; }
+  .throughput-weka-drops .legend-bottom .item { display:inline-flex; align-items:center; gap:6px; white-space:nowrap; }
+  .throughput-weka-drops .legend-bottom .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); display:inline-block; }
+  .throughput-weka-drops .legend-bottom .legend-title { font-size: 12px; font-weight: 700; color: var(--text-color); }
+  .throughput-weka-drops .legend-bottom { flex-direction: column; align-items: flex-start; gap: 6px; }
+  .throughput-weka-drops .lines path.active { stroke-width: 3; }
+  .throughput-weka-drops .d3-tooltip { z-index: var(--z-elevated); backdrop-filter: saturate(1.12) blur(8px); }
+  .throughput-weka-drops .d3-tooltip__inner { display:flex; flex-direction:column; gap:6px; min-width: 220px; }
+  .throughput-weka-drops .d3-tooltip__inner > div:first-child { font-weight: 800; letter-spacing: 0.1px; margin-bottom: 0; }
+  .throughput-weka-drops .d3-tooltip__inner > div:nth-child(2) { font-size: 11px; color: var(--muted-color); display: block; margin-top: -4px; margin-bottom: 2px; letter-spacing: 0.1px; }
+  .throughput-weka-drops .d3-tooltip__color-dot { display:inline-block; width: 12px; height: 12px; border-radius: 3px; border: 1px solid var(--border-color); }
+</style>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true }); if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('throughput-weka-drops'))){
+        const cs = Array.from(document.querySelectorAll('.throughput-weka-drops')).filter(el => !(el.dataset && el.dataset.mounted === 'true'));
+        container = cs[cs.length - 1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) { if (container.dataset.mounted === 'true') return; container.dataset.mounted = 'true'; }
+
+      // Tooltip
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        Object.assign(tip.style, {
+          position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none',
+          padding:'8px 10px', borderRadius:'8px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)',
+          background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 4px 24px rgba(0,0,0,.18)', opacity:'0', transition:'opacity .12s ease'
+        });
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // Header (legend) placed after the chart
+      const header = document.createElement('div'); header.className = 'chart-header';
+      const legendBottom = document.createElement('div'); legendBottom.className = 'legend-bottom'; header.appendChild(legendBottom);
+
+      // Chart card (SVG)
+      const card = document.createElement('div'); card.className = 'chart-card'; container.appendChild(card);
+      container.appendChild(header);
+      
+      // SVG
+      const svg = d3.select(card).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+      const gGrid = gRoot.append('g').attr('class','grid');
+      const gAxes = gRoot.append('g').attr('class','axes');
+      const gLines = gRoot.append('g').attr('class','lines');
+      const gPoints = gRoot.append('g').attr('class','points');
+      const overlay = gRoot.append('rect').attr('fill','transparent').style('cursor','crosshair');
+      const hoverLine = gRoot.append('line').attr('stroke-width',1).style('display','none');
+
+      // State/data
+      let width = 800, height = 480; const margin = { top: 16, right: 32, bottom: 44, left: 80 };
+      const xScale = d3.scaleLinear();
+      const yScale = d3.scaleLinear();
+      const lineGen = d3.line().x(d => xScale(d.step)).y(d => yScale(d.value));
+      let data = [];
+
+      // Colors - following guidelines to use ColorPalettes
+      let currentColor = 'var(--primary-color, #4e79a7)';
+      
+      function refreshPalette(){
+        try { 
+          if (window.ColorPalettes && typeof window.ColorPalettes.getColors === 'function') {
+            const colors = window.ColorPalettes.getColors('categorical', 1);
+            if (colors && colors.length > 0) {
+              currentColor = colors[0];
+              // Re-render with new colors
+              if (data.length > 0) render();
+              return;
+            }
+          }
+        } catch(_){}
+        // Fallback to CSS variable or default
+        currentColor = 'var(--primary-color, #4e79a7)';
+        // Re-render with fallback colors
+        if (data.length > 0) render();
+      }
+      
+      function getColor(){
+        return currentColor;
+      }
+      
+      // Format helper for thousands (5000 -> 5k, 1500 -> 1.5k)
+      function formatK(v){
+        const abs = Math.abs(v);
+        if (abs >= 1000) {
+          const n = v / 1000;
+          const s = d3.format('.1f')(n);
+          return (s.endsWith('.0') ? s.slice(0, -2) : s) + 'k';
+        }
+        return d3.format('d')(v);
+      }
+
+      // Format helper for throughput values
+      function formatThroughput(v){
+        if (v >= 1000) {
+          return d3.format('.1f')(v / 1000) + 'k';
+        }
+        return d3.format('.1f')(v);
+      }
+
+      function updateLayout(){
+        const axisColor = getComputedStyle(container).getPropertyValue('--axis-color').trim() || 'rgba(0,0,0,0.25)';
+        width = container.clientWidth || 800;
+        height = Math.max(280, Math.round(width / 3));
+        svg.attr('width', width).attr('height', height);
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        const innerWidth = width - margin.left - margin.right;
+        const innerHeight = height - margin.top - margin.bottom;
+        overlay.attr('x',0).attr('y',0).attr('width', innerWidth).attr('height', innerHeight);
+        hoverLine.attr('y1',0).attr('y2', innerHeight).attr('stroke', axisColor);
+        return { innerWidth, innerHeight };
+      }
+
+      function render(){
+        if (data.length === 0) return;
+        
+        const { innerWidth, innerHeight } = updateLayout();
+        
+        // Sort data by step
+        const sortedData = data.slice().sort((a, b) => a.step - b.step);
+        
+        // domains
+        const minStep = d3.min(sortedData, d => d.step);
+        const maxStep = d3.max(sortedData, d => d.step);
+        const minValue = d3.min(sortedData, d => d.value);
+        const maxValue = d3.max(sortedData, d => d.value);
+        
+        xScale.domain([minStep, maxStep]).range([0, innerWidth]);
+        yScale.domain([minValue, maxValue]).nice().range([innerHeight, 0]);
+
+        // grid
+        gGrid.selectAll('*').remove();
+        gGrid.selectAll('line').data(yScale.ticks(6)).join('line')
+          .attr('x1',0).attr('x2', innerWidth).attr('y1', d=>yScale(d)).attr('y2', d=>yScale(d))
+          .attr('stroke','var(--grid-color)').attr('stroke-width',1).attr('shape-rendering','crispEdges');
+
+        // axes
+        gAxes.selectAll('*').remove();
+        gAxes.append('g').attr('transform', `translate(0,${innerHeight})`).call(d3.axisBottom(xScale).ticks(8).tickFormat(formatK)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('g').call(d3.axisLeft(yScale).ticks(6).tickFormat(formatThroughput)).call(g=>{ g.selectAll('path, line').attr('stroke','var(--axis-color)'); g.selectAll('text').attr('fill','var(--tick-color)').style('font-size','12px'); });
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('x', innerWidth/2).attr('y', innerHeight + 38).text('Training Step');
+        gAxes.append('text').attr('class','axis-label').attr('text-anchor','middle').attr('transform', `translate(${-60}, ${innerHeight/2}) rotate(-90)`).text('Tokens/sec/GPU');
+
+        // line
+        const color = getColor();
+        gLines.selectAll('*').remove();
+        gLines.append('path')
+          .attr('class','line')
+          .attr('fill','none')
+          .attr('stroke', color)
+          .attr('stroke-width', 2)
+          .attr('d', lineGen(sortedData));
+
+        // point markers
+        gPoints.selectAll('*').remove();
+        gPoints.selectAll('circle').data(sortedData).join('circle')
+          .attr('class','point')
+          .attr('r', 2)
+          .attr('fill', color)
+          .attr('fill-opacity', 0.6)
+          .attr('cx', d=>xScale(d.step))
+          .attr('cy', d=>yScale(d.value));
+
+        // legend
+        legendBottom.innerHTML = `<div class="legend-title">Throughput</div><div class="items"><span class="item"><span class="swatch" style="background:${color}"></span><span>Tokens/sec/GPU</span></span></div>`;
+
+        // hover
+        function onMove(ev){
+          const [mx, my] = d3.pointer(ev, overlay.node());
+          const sx = xScale.invert(mx);
+          
+          // Find nearest point
+          const nearest = sortedData.reduce((best, d) => Math.abs(d.step - sx) < Math.abs(best.step - sx) ? d : best, sortedData[0]);
+          const xpx = xScale(nearest.step);
+          hoverLine.style('display', null).attr('x1', xpx).attr('x2', xpx);
+          
+          // tooltip content
+          let html = `<div style="font-weight:800;letter-spacing:.1px;">Training Throughput</div><div style="font-size:11px;color:var(--muted-color);margin-top:-4px;margin-bottom:2px;">Step ${formatK(nearest.step)}</div>`;
+          html += `<div style="display:flex;align-items:center;gap:6px;white-space:nowrap;"><span class="d3-tooltip__color-dot" style="background:${color}"></span><strong>Tokens/sec/GPU</strong><span style="margin-left:auto;">${formatThroughput(nearest.value)}</span></div>`;
+          
+          tipInner.innerHTML = html; 
+          tip.style.opacity = '1'; 
+          tip.style.transform = `translate(${Math.round(mx + margin.left + 12)}px, ${Math.round(my + margin.top + 12)}px)`;
+        }
+        
+        function onLeave(){ 
+          tip.style.opacity='0'; 
+          tip.style.transform='translate(-9999px, -9999px)'; 
+          hoverLine.style('display','none'); 
+        }
+        
+        overlay.on('mousemove', onMove).on('mouseleave', onLeave);
+      }
+
+      // load CSV and init
+      (async () => {
+        try {
+          // Try multiple possible paths for the CSV file
+          const csvPaths = [
+            '/data/weka_drop_0404.csv',
+            './assets/data/weka_drop_0404.csv',
+            '../assets/data/weka_drop_0404.csv',
+            '../../assets/data/weka_drop_0404.csv'
+          ];
+          
+          let csvText = null;
+          for (const path of csvPaths) {
+            try {
+              const response = await fetch(path, { cache: 'no-cache' });
+              if (response.ok) {
+                csvText = await response.text();
+                break;
+              }
+            } catch(_) {}
+          }
+          
+          if (!csvText) {
+            throw new Error('CSV file not found: weka_drop_0404.csv');
+          }
+          
+          const rows = d3.csvParse(csvText);
+          
+          // Parse the data - use the second column (tokens_per_sec_per_gpu) and ignore min/max
+          data = rows.map(d => ({
+            step: +d.Step,
+            value: +d["04/04/2025_02:44:57_elie-smollm3-training-3p56G-smollm3-3B-start-0404-stage-1-wo-zloss-seed6-ddp-256-seed-6-_tp_group_1 - tokens_per_sec_per_gpu"]
+          })).filter(d => !isNaN(d.step) && !isNaN(d.value));
+          
+          // Initialize palette and listen for changes
+          refreshPalette();
+          document.addEventListener('palettes:updated', refreshPalette);
+          
+          render();
+          
+          const rerender = () => render();
+          if (window.ResizeObserver) { 
+            const ro = new ResizeObserver(() => rerender()); 
+            ro.observe(container); 
+          } else { 
+            window.addEventListener('resize', rerender); 
+          }
+        } catch (e) {
+          const pre = document.createElement('pre'); 
+          pre.textContent = 'CSV load error: ' + (e && e.message ? e.message : e);
+          pre.style.color = 'var(--danger, #b00020)'; 
+          pre.style.fontSize = '12px'; 
+          pre.style.whiteSpace = 'pre-wrap'; 
+          container.appendChild(pre);
+        }
+      })();
+    };
+
+    if (document.readyState === 'loading') { 
+      document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); 
+    } else { 
+      ensureD3(bootstrap); 
+    }
+  })();
+</script>
diff --git a/app/src/content/embeds/vibe-code-d3-embeds-directives.md b/app/src/content/embeds/vibe-code-d3-embeds-directives.md
new file mode 100644
index 0000000000000000000000000000000000000000..329833c8a753e2ee29aff29f8edd12da5d4481c8
--- /dev/null
+++ b/app/src/content/embeds/vibe-code-d3-embeds-directives.md
@@ -0,0 +1,504 @@
+## Embed Chart Authoring Guidelines
+
+### Quickstart (TL;DR)
+- Create a single self-contained HTML fragment: root div + scoped style + IIFE script.
+- Draw marks/axes in SVG; render UI (legend and controls) in HTML.
+- Place legend and controls BELOW the chart (header appended after the chart). Include a legend title "Legend" and a select labeled "Metric" when relevant.
+- Load data from public `/data` first, then fall back to `assets/data`.
+- Use `window.ColorPalettes` for colors; stick to CSS variables for theming.
+
+Minimal header markup:
+```html
+<div class="legend">
+  <div class="legend-title">Legend</div>
+  <div class="items"></div>
+  <!-- items populated by JS: <span class="item"><span class="swatch"></span><span>Name</span></span> -->
+</div>
+<div class="controls">
+  <div class="control-group">
+    <label for="metric-select-<id>">Metric</label>
+    <select id="metric-select-<id>"></select>
+  </div>
+  <!-- optional: other controls -->
+</div>
+```
+
+See also: `d3-line-simple.html`, `d3-line-quad.html`, `d3-benchmark.html`.
+
+Authoring rules for creating a new interactive chart as a single self-contained `.html` file under `src/content/embeds/`. These conventions are derived from `d3-bar.html`, `d3-comparison.html`, `d3-neural.html`, `d3-line.html`, and `d3-pie.html`.
+
+### A) Colors & palettes (MANDATORY)
+- Always obtain color arrays from `window.ColorPalettes`; do not hardcode palettes.
+- Use the categorical/sequential/diverging helpers and the current primary color.
+- If you change `--primary-color` dynamically, call `window.ColorPalettes.refresh()` so listeners update.
+
+Usage:
+```js
+// Usage (with explicit counts)
+const cat = window.ColorPalettes.getColors('categorical', 8);
+const seq = window.ColorPalettes.getColors('sequential', 8);
+const div = window.ColorPalettes.getColors('diverging', 7);
+
+// For current primary color string
+const primaryHex = window.ColorPalettes.getPrimary();
+
+// If you change --primary-color dynamically, call refresh to notify listeners
+document.documentElement.style.setProperty('--primary-color', '#6D4AFF');
+window.ColorPalettes.refresh();
+```
+
+Notes:
+- Keep chart accents (lines, markers, selection) aligned with `--primary-color`.
+- Prefer CSS variables for fills/strokes when possible; derive series colors via `ColorPalettes`.
+- Provide a graceful fallback to CSS variables if `window.ColorPalettes` is unavailable.
+
+### B) Layout & form elements (HTML-only)
+- All UI controls (labels, selects, sliders, buttons, toggles) must be plain HTML inside the root container.
+- Do not draw controls with SVG; style them consistently (rounded 8px, custom caret, focus ring).
+- Use `<label>` wrapping inputs for accessibility and concise text (e.g., "Metric", "Model Size").
+- Manage layout with CSS inside the scoped `<style>` for the root class; avoid global rules.
+
+### C) SVG scope: charts only; UI in HTML
+- SVG is for chart primitives (marks, axes, gridlines) only.
+- Put legends and controls in HTML (adjacent DOM is preferred; `foreignObject` only if necessary).
+- Tooltips are HTML positioned absolutely inside the root container.
+  - Details: see sections 4 (controls), 5 (tooltips), 8 (legends).
+
+### 1) File, naming, and structure
+- Name files with a clear prefix and purpose: `d3-<type>.html` (e.g., `d3-scatter.html`).
+- Wrap everything in a single `<div class="<root-class>">`, a `<style>` block scoped to that root class, and a `<script>` IIFE.
+- Do not leak globals; do not attach anything to `window`.
+- Use a unique, descriptive root class (e.g., `.d3-scatter`).
+
+Minimal skeleton:
+```html
+<div class="d3-yourchart"></div>
+<style>
+  .d3-yourchart {/* all styles scoped to the root */}
+</style>
+<script>
+  (() => {
+    // Optional dependency loader (e.g., D3)
+    const ensureD3 = (cb) => {
+      if (window.d3 && typeof window.d3.select === 'function') return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id = 'd3-cdn-script'; s.src = 'https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && typeof window.d3.select === 'function') cb(); };
+      s.addEventListener('load', onReady, { once: true });
+      if (window.d3) onReady();
+    };
+
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      // Prefer the closest previous sibling with the root class
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-yourchart'))) {
+        // Fallback: pick the last unmounted instance in the page
+        const candidates = Array.from(document.querySelectorAll('.d3-yourchart'))
+          .filter((el) => !(el.dataset && el.dataset.mounted === 'true'));
+        container = candidates[candidates.length - 1] || null;
+      }
+      if (!container) return;
+      if (container.dataset) {
+        if (container.dataset.mounted === 'true') return;
+        container.dataset.mounted = 'true';
+      }
+
+      // Tooltip (optional)
+      container.style.position = container.style.position || 'relative';
+      let tip = container.querySelector('.d3-tooltip'); let tipInner;
+      if (!tip) {
+        tip = document.createElement('div'); tip.className = 'd3-tooltip';
+        Object.assign(tip.style, { position:'absolute', top:'0px', left:'0px', transform:'translate(-9999px, -9999px)', pointerEvents:'none', padding:'8px 10px', borderRadius:'8px', fontSize:'12px', lineHeight:'1.35', border:'1px solid var(--border-color)', background:'var(--surface-bg)', color:'var(--text-color)', boxShadow:'0 4px 24px rgba(0,0,0,.18)', opacity:'0', transition:'opacity .12s ease' });
+        tipInner = document.createElement('div'); tipInner.className = 'd3-tooltip__inner'; tipInner.style.textAlign='left'; tip.appendChild(tipInner); container.appendChild(tip);
+      } else { tipInner = tip.querySelector('.d3-tooltip__inner') || tip; }
+
+      // SVG scaffolding (if using D3)
+      const svg = d3.select(container).append('svg').attr('width','100%').style('display','block');
+      const gRoot = svg.append('g');
+
+      // State & layout
+      let width = 800, height = 360; const margin = { top: 16, right: 28, bottom: 56, left: 64 };
+      function updateSize(){
+        const isDark = document.documentElement.getAttribute('data-theme') === 'dark';
+        width = container.clientWidth || 800;
+        height = Math.max(260, Math.round(width / 3));
+        svg.attr('width', width).attr('height', height);
+        gRoot.attr('transform', `translate(${margin.left},${margin.top})`);
+        return { innerWidth: width - margin.left - margin.right, innerHeight: height - margin.top - margin.bottom, isDark };
+      }
+
+      function render(){
+        const { innerWidth, innerHeight } = updateSize();
+        // ... draw/update your chart here using data joins
+      }
+
+      // Initial render + resize handling
+      render();
+      const rerender = () => render();
+      if (window.ResizeObserver) { const ro = new ResizeObserver(() => rerender()); ro.observe(container); }
+      else { window.addEventListener('resize', rerender); }
+    };
+
+    if (document.readyState === 'loading') { document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once: true }); }
+    else { ensureD3(bootstrap); }
+  })();
+</script>
+```
+
+### 2) Mounting and re-entrancy
+- Select the closest previous sibling with the root class; fallback to the last unmounted matching element in the document.
+- Gate with `data-mounted` to avoid double-initialization when the fragment re-runs.
+- Assume the chart can appear multiple times on the same page.
+
+### 3) Styling and theming
+- Scope all rules under the root class; do not style `body`, `svg` globally.
+- Use CSS variables for theme alignment: `--primary-color`, `--text-color`, `--muted-color`, `--surface-bg`, `--border-color`.
+- Derive palette colors from `window.ColorPalettes` (categorical, sequential, diverging); do not hardcode arrays.
+- For dark mode–aware strokes/ticks, either:
+  - Read `document.documentElement.getAttribute('data-theme') === 'dark'`, or
+  - Prefer CSS-only where possible.
+- Keep backgrounds light and borders subtle; the outer card frame is handled by `HtmlEmbed.astro`.
+
+Standard axis/tick/grid colors (global variables from `_variables.css`):
+
+```css
+/* Provided globally */
+:root {
+  --axis-color: var(--text-color);
+  --tick-color: var(--muted-color);
+  --grid-color: rgba(0,0,0,.08);
+}
+[data-theme="dark"] {
+  --axis-color: var(--text-color);
+  --tick-color: var(--muted-color);
+  --grid-color: rgba(255,255,255,.10);
+}
+/* Apply inside charts */
+.your-root-class .axes path,
+.your-root-class .axes line { stroke: var(--axis-color); }
+.your-root-class .axes text { fill: var(--tick-color); }
+.your-root-class .grid line { stroke: var(--grid-color); }
+```
+
+#### 3.1) Text on fixed-colored backgrounds
+
+- When rendering text over cells/areas with fixed background colors (that do not change with theme), compute a readable text style once from the actual background color.
+- Use `window.ColorPalettes.getTextStyleForBackground(bgCss, { blend: 0.6 })` when available; avoid tying text color to dark mode toggles since the background is constant.
+- Do not re-evaluate on theme toggle unless the background color itself changes.
+
+Example:
+```js
+const bg = getComputedStyle(cellRect).fill; // e.g., 'rgb(12, 34, 56)'
+const style = window.ColorPalettes?.getTextStyleForBackground
+  ? window.ColorPalettes.getTextStyleForBackground(bg, { blend: 0.6 })
+  : { fill: 'var(--text-color)' };
+textSel.style('fill', style.fill);
+```
+
+### 4) Controls (labels, selects, sliders)
+- Compose controls as plain HTML elements appended inside the root container (no SVG UI).
+- Style selects like in `d3-line.html`/`d3-bar.html` for consistency (rounded 8px, custom caret via data-URI, focus ring).
+- Use `<label>` wrapping the input for accessibility; set concise text (e.g., "Metric", "Model Size").
+
+#### 4.1) Required select label: "Metric"
+- When a select is used to switch metrics, include a visible label above the select with the exact text "Metric".
+- Preferred markup (grouped for easy vertical stacking):
+
+```html
+<div class="controls">
+  <div class="control-group">
+    <label for="metric-select-<unique>">Metric</label>
+    <select id="metric-select-<unique>"></select>
+  </div>
+</div>
+```
+
+Minimal CSS (match project styles):
+
+```css
+.controls { display:flex; gap:16px; align-items:center; justify-content:flex-end; flex-wrap:wrap; }
+.controls .control-group { display:flex; flex-direction:column; align-items:flex-start; gap:6px; }
+.controls label { font-size:12px; font-weight:700; color: var(--text-color); }
+.controls select { font-size:12px; padding:8px 28px 8px 10px; border:1px solid var(--border-color); border-radius:8px; background: var(--surface-bg); color: var(--text-color); }
+```
+
+### 5) Tooltip pattern
+- Create a single `.d3-tooltip` absolutely positioned inside the container.
+- Show on hover, hide on leave; position using `d3.pointer(event, container)` plus a small offset.
+- Keep content in a `.d3-tooltip__inner` node; avoid large inner HTML.
+
+### 6) Data loading
+- Prefer public assets first, then fall back to content assets:
+  - Example CSV paths: `/data/<file>.csv`, then `./assets/data/<file>.csv`, `../assets/data/<file>.csv`, etc.
+- Implement `fetchFirstAvailable(paths)`; try in order with `cache:'no-cache'`; handle errors gracefully with a red `<pre>` message.
+- For images or JSON models, mirror the same approach (see `d3-comparison.html`, `d3-neural.html`).
+
+#### 6.1) Data props (HtmlEmbed → embed)
+
+- HtmlEmbed accepts an optional `data` prop that can be a string (single file) or an array of strings (multiple files).
+- This prop is passed to the fragment via the `data-datafiles` HTML attribute.
+- In the embed script, read this attribute from the closest ancestor that carries it (the `HtmlEmbed` wrapper), not necessarily the chart’s direct container.
+- Recommended normalization: if a value contains no slash, automatically prefix it with `/data/` to target the public data folder.
+- If `data` is not provided, keep the usual fallback (public, then `assets/data`).
+
+Optional configuration (e.g., default metric):
+
+```js
+// In HtmlEmbed usage (MDX):
+<HtmlEmbed src="d3-line-simple.html" data="internal_deduplication.csv" config={{ defaultMetric: 'average_rank' }} />
+
+// In the embed script (read from closest ancestor):
+let mountEl = container;
+while (mountEl && !mountEl.getAttribute?.('data-datafiles') && !mountEl.getAttribute?.('data-config')) {
+  mountEl = mountEl.parentElement;
+}
+let providedConfig = null;
+try {
+  const cfg = mountEl && mountEl.getAttribute ? mountEl.getAttribute('data-config') : null;
+  if (cfg && cfg.trim()) providedConfig = cfg.trim().startsWith('{') ? JSON.parse(cfg) : cfg;
+} catch(_) {}
+// Example: selecting initial metric if present
+const desired = providedConfig && providedConfig.defaultMetric ? String(providedConfig.defaultMetric) : null;
+```
+
+Examples (MDX):
+
+```mdx
+<HtmlEmbed src="d3-line-simple.html" title="Run A" data="formatting_filters.csv" />
+<HtmlEmbed src="d3-line-simple.html" title="Run B" data="relevance_filters.csv" />
+
+<HtmlEmbed
+  src="d3-line-simple.html"
+  title="Comparison A vs B"
+  data={[ 'formatting_filters.csv', 'relevance_filters.csv' ]}
+/>
+```
+
+Reading on the embed side (JS):
+
+```js
+// Find the closest ancestor that carries the attribute
+let mountEl = container;
+while (mountEl && !mountEl.getAttribute?.('data-datafiles')) {
+  mountEl = mountEl.parentElement;
+}
+let providedData = null;
+try {
+  const attr = mountEl && mountEl.getAttribute ? mountEl.getAttribute('data-datafiles') : null;
+  if (attr && attr.trim()) {
+    providedData = attr.trim().startsWith('[') ? JSON.parse(attr) : attr.trim();
+  }
+} catch(_) {}
+
+const DEFAULT_CSV = '/data/formatting_filters.csv';
+const ensureDataPrefix = (p) => (typeof p === 'string' && p && !p.includes('/')) ? `/data/${p}` : p;
+const normalizeInput = (inp) => Array.isArray(inp)
+  ? inp.map(ensureDataPrefix)
+  : (typeof inp === 'string' ? [ ensureDataPrefix(inp) ] : null);
+
+const CSV_PATHS = Array.isArray(providedData)
+  ? normalizeInput(providedData)
+  : (typeof providedData === 'string' ? normalizeInput(providedData) || [DEFAULT_CSV] : [
+      DEFAULT_CSV,
+      './assets/data/formatting_filters.csv',
+      '../assets/data/formatting_filters.csv',
+      '../../assets/data/formatting_filters.csv'
+    ]);
+
+const fetchFirstAvailable = async (paths) => {
+  for (const p of paths) {
+    try {
+      const r = await fetch(p, { cache: 'no-cache' });
+      if (r.ok) return await r.text();
+    } catch(_){}
+  }
+  throw new Error('CSV not found');
+};
+```
+
+### 7) Responsiveness and layout
+- Compute `width = container.clientWidth`, and a height derived from width (e.g., `width / 3`), with a sensible minimum height.
+- Maintain a `margin` object and derive `innerWidth/innerHeight` for plots.
+- Use a `ResizeObserver` on the container; fallback to `window.resize`.
+- Recompute scales/axes/grid on every render.
+
+### 8) Legends and labels
+- Prefer HTML for legends for wrapping and accessibility; avoid SVG-based legends.
+- Always add axis labels when applicable (e.g., `Step`, `Value`).
+- Standardize legend swatch size: 14×14px, border-radius 3px, 1px border `var(--border-color)`.
+
+#### 8.1) Required legend title: "Legend"
+- Always render a visible title above legend items with the exact text "Legend".
+- Canonical markup:
+
+```html
+<div class="legend">
+  <div class="legend-title">Legend</div>
+  <div class="items">
+    <!-- <span class="item"><span class="swatch"></span><span>Series A</span></span> ... -->
+  </div>
+</div>
+```
+
+Minimal CSS (match project styles):
+
+```css
+.legend { display:flex; flex-direction:column; align-items:flex-start; gap:6px; }
+.legend-title { font-size:12px; font-weight:700; color: var(--text-color); }
+.legend .items { display:flex; flex-wrap:wrap; gap:8px 14px; }
+.legend .item { display:inline-flex; align-items:center; gap:6px; white-space:nowrap; font-size:12px; color: var(--text-color); }
+.legend .swatch { width:14px; height:14px; border-radius:3px; border:1px solid var(--border-color); }
+```
+
+Recommended JS pattern to (re)build the legend:
+
+```js
+function makeLegend(seriesNames, colorFor) {
+  let legend = container.querySelector('.legend');
+  if (!legend) { legend = document.createElement('div'); legend.className = 'legend'; container.appendChild(legend); }
+  let title = legend.querySelector('.legend-title'); if (!title) { title = document.createElement('div'); title.className = 'legend-title'; title.textContent = 'Legend'; legend.appendChild(title); }
+  let items = legend.querySelector('.items'); if (!items) { items = document.createElement('div'); items.className = 'items'; legend.appendChild(items); }
+  items.innerHTML = '';
+  seriesNames.forEach(name => {
+    const el = document.createElement('span'); el.className = 'item';
+    const sw = document.createElement('span'); sw.className = 'swatch'; sw.style.background = colorFor(name);
+    const txt = document.createElement('span'); txt.textContent = name;
+    el.appendChild(sw); el.appendChild(txt); items.appendChild(el);
+  });
+}
+```
+
+### 9) Accessibility
+- Provide `alt` attributes on `<img>` (see `d3-comparison.html`).
+- Provide `aria-label` on interactive buttons (e.g., the erase button in `d3-neural.html`).
+- Ensure focus-visible styles for interactive controls; avoid relying on color alone to encode meaning.
+
+### 10) Performance and updates
+- Use D3 data joins (`.data().join()` or explicit enter/merge/exit) and keep transitions short (≤200ms).
+- Recompute only what is necessary on each render; avoid repeated DOM clears if not needed.
+- Debounce or gate expensive computations, especially on `mousemove`.
+
+### 11) External dependencies
+- Load D3 (and optional TFJS) via CDN only once using an element id (e.g., `d3-cdn-script`, `tfjs-cdn-script`).
+- After `.load`, verify the expected API (e.g., `window.d3.select`).
+- Prefer pure D3 and built-ins; do not introduce new runtime dependencies unless necessary.
+
+### 12) Error handling and fallbacks
+- Fail gracefully: append a small `<pre>` with a readable message inside the container.
+- For optional models (e.g., TFJS), attempt multiple URLs and fall back to a heuristic if load fails.
+
+### 13) Printing
+- Favor vector (`svg`) or simple shapes; avoid large bitmap backgrounds.
+- Let `HtmlEmbed.astro` handle most print constraints; ensure the chart scales with width 100% and auto height.
+
+### 14) Conventions checklist (before committing)
+- Root class is unique and matches file name (`d3-<type>`).
+- No globals added; script wrapped in an IIFE.
+- `data-mounted` guard is present to avoid double-mount.
+- Colors come from `window.ColorPalettes` (no hardcoded arrays); `--primary-color` respected.
+- Uses CSS variables for colors; dark-mode friendly.
+- Responsive: recomputes layout on resize; uses `ResizeObserver`.
+- Controls are HTML-only, accessible, and consistently styled.
+- Legends and tooltips are HTML, not SVG.
+- Data loading includes public-path-first strategy and graceful error.
+- Axes/labels are legible at small widths.
+- Code is easy to skim: clear naming, early returns, short functions.
+
+### 14.1) Agent Checklist (operational)
+- Ensure root: one `<div .d3-xyz>` + scoped `<style>` + IIFE `<script>`
+- Gate mount with `data-mounted` and select closest previous sibling instance
+- Load D3 once via `#d3-cdn-script`; verify `window.d3.select`
+- Colors from `window.ColorPalettes` with CSS variable fallbacks
+- Legend present with visible title “Legend”; HTML-based, not SVG
+- Controls in HTML only; if metric select exists, label text must be “Metric”
+- Tooltip is a single absolute `.d3-tooltip` within the container
+- Data load public-first; implement `fetchFirstAvailable([...])` with `cache:'no-cache'`
+- Read optional HtmlEmbed `data-datafiles` and `data-config` per section 6.1
+- Responsiveness: width from container; `ResizeObserver` fallback to `window.resize`
+- Axis/tick/grid use CSS variables (`--axis-color`, `--tick-color`, `--grid-color`)
+- SVG for marks only; UI/legend/controls in HTML
+- No globals leaked; no external runtime deps besides D3/TFJS when necessary
+- Error path: append small red `<pre>` with a readable message inside container
+- Print-friendly: `svg` width 100%, height responsive, avoid heavy bitmaps
+
+### 14.2) Definition of Done (DoD)
+- Implements root structure and mounting guard
+- Uses `ColorPalettes` (with safe fallback) and CSS variables for theming
+- Legend with title “Legend” and consistent swatch style (14×14, r=3, 1px border)
+- Metric select labelled “Metric” when present; accessible markup (`<label for>`)
+- Tooltip works (show on hover, hide on leave, positioned via `d3.pointer`)
+- Public-first data loading + HtmlEmbed prop support when applicable
+- Responsive: resizes smoothly; axes and grid legible at small widths
+- No console errors; graceful error message on load failures
+- File is self‑contained; no globals; lints pass
+
+### 14.3) Prompt modèle (for the agent)
+```markdown
+You are implementing a self-contained D3 embed fragment.
+Name: d3-<type>.html (root class .d3-<type>)
+Requirements:
+- One root div + scoped style + IIFE script; no globals
+- UI in HTML (legend+controls), chart primitives in SVG
+- Legend title text exactly “Legend”; swatch 14×14, r=3, 1px border
+- If a select toggles metrics, visible label text exactly “Metric”
+- Colors via window.ColorPalettes (categorical/sequential/diverging), fallback to CSS variables or Tableau10
+- Tooltip: single .d3-tooltip inside container, HTML, positioned via d3.pointer
+- Data loading: try `/data/<file>` first, then `./assets/data/<file>`, `../assets/data/<file>`; implement fetchFirstAvailable(paths)
+- Read optional HtmlEmbed attributes `data-datafiles` and `data-config` if present (see section 6.1)
+- Responsiveness: compute width from container, use ResizeObserver; axis/tick/grid via CSS vars
+- Error handling: append small red <pre> inside container on failure
+Deliver one .html file with only the required elements.
+```
+
+### 15) Example: small bar chart (structure only)
+```html
+<div class="d3-mini-bar"></div>
+<style>
+  .d3-mini-bar .bar { stroke: none; }
+</style>
+<script>
+  (() => {
+    const ensureD3 = (cb) => {
+      if (window.d3 && d3.select) return cb();
+      let s = document.getElementById('d3-cdn-script');
+      if (!s) { s = document.createElement('script'); s.id='d3-cdn-script'; s.src='https://cdn.jsdelivr.net/npm/d3@7/dist/d3.min.js'; document.head.appendChild(s); }
+      const onReady = () => { if (window.d3 && d3.select) cb(); };
+      s.addEventListener('load', onReady, { once:true }); if (window.d3) onReady();
+    };
+    const bootstrap = () => {
+      const scriptEl = document.currentScript;
+      let container = scriptEl ? scriptEl.previousElementSibling : null;
+      if (!(container && container.classList && container.classList.contains('d3-mini-bar'))){
+        const cs = Array.from(document.querySelectorAll('.d3-mini-bar')).filter(el => !(el.dataset && el.dataset.mounted==='true'));
+        container = cs[cs.length-1] || null;
+      }
+      if (!container) return;
+      if (container.dataset){ if (container.dataset.mounted==='true') return; container.dataset.mounted='true'; }
+
+      const svg = d3.select(container).append('svg').attr('width','100%').style('display','block');
+      const g = svg.append('g');
+      let width=800,height=280; const margin={top:16,right:16,bottom:40,left:40};
+      const x=d3.scaleBand().padding(0.2), y=d3.scaleLinear();
+      const data=[{k:'A',v:3},{k:'B',v:7},{k:'C',v:5}];
+
+      function render(){
+        width = container.clientWidth || 800; height = Math.max(220, Math.round(width/3.2));
+        svg.attr('width', width).attr('height', height);
+        g.attr('transform',`translate(${margin.left},${margin.top})`);
+        const iw=width-margin.left-margin.right, ih=height-margin.top-margin.bottom;
+        x.domain(data.map(d=>d.k)).range([0,iw]); y.domain([0, d3.max(data,d=>d.v)||1]).range([ih,0]).nice();
+        const bars=g.selectAll('rect.bar').data(data);
+        bars.join('rect').attr('class','bar').attr('x',d=>x(d.k)).attr('y',d=>y(d.v)).attr('width',x.bandwidth()).attr('height',d=>Math.max(0.5, ih - y(d.v))).attr('fill','var(--primary-color)');
+        g.selectAll('.x').data([0]).join('g').attr('class','x').attr('transform',`translate(0,${ih})`).call(d3.axisBottom(x));
+        g.selectAll('.y').data([0]).join('g').attr('class','y').call(d3.axisLeft(y).ticks(5));
+      }
+      render();
+      const ro = window.ResizeObserver ? new ResizeObserver(() => render()) : null; if (ro) ro.observe(container); else window.addEventListener('resize', render);
+    };
+    if (document.readyState==='loading'){ document.addEventListener('DOMContentLoaded', () => ensureD3(bootstrap), { once:true }); } else { ensureD3(bootstrap); }
+  })();
+</script>
+```
+
+
diff --git a/app/src/styles/global.css b/app/src/styles/global.css
index 2e94501842520ae0c5d7200040a0a592c057f4bf..42d91c93a8fb952b562f0e1a455e13b03f8de310 100644
--- a/app/src/styles/global.css
+++ b/app/src/styles/global.css
@@ -8,7 +8,7 @@
 @import './components/_table.css';
 @import './components/_tag.css';
 @import './components/_card.css';
-@import './components/_form.css'; 
+@import './components/_form.css';
 
 .demo-wide,
 .demo-full-width {
@@ -27,6 +27,10 @@
 }
 
 .mermaid {
-    background: none!important;
-    margin-bottom: var(--block-spacing-y) !important;
+  background: none !important;
+  margin-bottom: var(--block-spacing-y) !important;
+}
+
+.katex .tag {
+  display: none;
 }
\ No newline at end of file