@@ -3844,13 +5427,173 @@ Cell: combine | 36.17s
# /// script
# [tool.uv.sources]
# kernels-benchmark-tools = { git = "https://github.com/drbh/kernels-benchmark-tools.git", branch = "main" }
# ///
-import torch
-import sys
import os
-import kernels_benchmark_tools as kbt
+import sys
from pathlib import Path
+import json
+import torch # noqa: F401 # imported because upstream may expect torch to be importable
+import kernels_benchmark_tools as kbt
+
+# --- Matplotlib setup and helpers ------------------------------------------------
+import matplotlib as mpl
+import matplotlib.pyplot as plt
+import csv
+
+
+# Keep text as text (not paths) so CSS can style fonts, size, etc.
+mpl.rcParams["svg.fonttype"] = "none"
+# Make ids deterministic across builds
+mpl.rcParams["svg.hashsalt"] = "latency-benchmark-combined"
+# Use tight layout so labels and titles are not clipped in the exported SVG
+mpl.rcParams["figure.autolayout"] = True
+# Make background transparent
+mpl.rcParams["figure.facecolor"] = "none"
+mpl.rcParams["axes.facecolor"] = "none"
+mpl.rcParams["savefig.facecolor"] = "none"
+mpl.rcParams["savefig.edgecolor"] = "none"
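+# Together these rcParams make the exported SVG deterministic, transparent,
+# and CSS-stylable, which the id/class tagging below builds on.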
+
+def _slugify(s: str) -> str:
+    s = (s or "").strip().lower()
+    keep = []
+    for ch in s:
+        if ch.isalnum():
+            keep.append(ch)
+        elif ch in (" ", "-", "_", "/", ".", ":"):
+            keep.append("-")
+        # any other character is dropped
+    out = "".join(keep)
+    while "--" in out:
+        out = out.replace("--", "-")
+    return out.strip("-") or "unnamed"
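+# Example: _slugify("HF Kernels Flash Attn3") -> "hf-kernels-flash-attn3"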
+
+def _tag_current_figure(default_series_prefix="series"):
+    """Attach SVG ids (gid) to key artists so they can be targeted from CSS."""
+    fig = plt.gcf()  # gcf() creates a figure if none exists, so this is never None
+
+    # Tag the figure itself
+    fig.set_gid("figure--latency")
+
+    for ax_idx, ax in enumerate(fig.get_axes(), start=1):
+        ax.set_gid(f"axes--{ax_idx}")
+
+        # Axis labels & title (ax.title is the Text artist holding the title)
+        if ax.get_title():
+            ax.title.set_gid("title--main")
+        if ax.xaxis and ax.xaxis.get_label():
+            ax.xaxis.label.set_gid("label--x")
+        if ax.yaxis and ax.yaxis.get_label():
+            ax.yaxis.label.set_gid("label--y")
+
+        # Gridlines
+        for i, gl in enumerate(ax.get_xgridlines(), start=1):
+            gl.set_gid(f"grid-x--{i}")
+        for i, gl in enumerate(ax.get_ygridlines(), start=1):
+            gl.set_gid(f"grid-y--{i}")
+
+        # Legend block & entries
+        leg = ax.get_legend()
+        if leg is not None:
+            leg.set_gid("legend")
+            for i, txt in enumerate(leg.get_texts(), start=1):
+                label_slug = _slugify(txt.get_text())
+                txt.set_gid(f"legend-label--{label_slug or i}")
+
+        # Series: lines
+        line_seen = {}
+        for ln in getattr(ax, "lines", []):
+            raw_label = ln.get_label() or ""
+            # Matplotlib uses labels beginning with "_" for non-legendable items
+            label = raw_label if not raw_label.startswith("_") else default_series_prefix
+            slug = _slugify(label)
+            line_seen[slug] = line_seen.get(slug, 0) + 1
+            suffix = "" if line_seen[slug] == 1 else f"-{line_seen[slug]}"
+            ln.set_gid(f"series--{slug}{suffix}")
+
+        # Series: patches (bars, areas)
+        patch_seen = {}
+        for pt in getattr(ax, "patches", []):
+            label = getattr(pt, "get_label", lambda: "")() or default_series_prefix
+            if isinstance(label, str) and label.startswith("_"):
+                label = default_series_prefix
+            slug = _slugify(label)
+            patch_seen[slug] = patch_seen.get(slug, 0) + 1
+            suffix = "" if patch_seen[slug] == 1 else f"-{patch_seen[slug]}"
+            pt.set_gid(f"series--{slug}{suffix}")
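+# After tagging, artists carry ids such as "series--hf-kernels-flash-attn3",
+# "grid-x--3", or "legend-label--xformers", so individual series can be
+# themed or highlighted from the embedding page's CSS.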
+
+def _postprocess_svg_add_classes(svg_path: Path):
+    """Add convenient CSS classes alongside ids (e.g., class='series grid grid-x')."""
+    try:
+        import xml.etree.ElementTree as ET
+        ET.register_namespace("", "http://www.w3.org/2000/svg")
+        tree = ET.parse(svg_path)
+        root = tree.getroot()
+        for el in root.iter():
+            el_id = el.attrib.get("id", "")
+            if not el_id:
+                continue
+            cls = []
+            if el_id.startswith("figure--"):
+                cls.append("figure")
+            elif el_id.startswith("axes--"):
+                cls.append("axes")
+            elif el_id.startswith("grid-x--"):
+                cls += ["grid", "grid-x"]
+            elif el_id.startswith("grid-y--"):
+                cls += ["grid", "grid-y"]
+            elif el_id.startswith("legend"):
+                cls.append("legend")
+            elif el_id.startswith("label--x"):
+                cls.append("xlabel")
+            elif el_id.startswith("label--y"):
+                cls.append("ylabel")
+            elif el_id.startswith("title--"):
+                cls.append("title")
+            elif el_id.startswith("series--"):
+                cls.append("series")
+            if cls:
+                # Preserve any existing class (unlikely from Matplotlib)
+                existing = el.attrib.get("class", "")
+                el.set("class", (existing + " " + " ".join(cls)).strip())
+        tree.write(svg_path, encoding="utf-8", xml_declaration=True)
+    except Exception as e:
+        print(f"✗ SVG postprocess (classes) skipped: {e}")
+
+# Monkey-patch savefig to force SVG & ensure tagging occurs even if kbt.viz saves internally.
+_orig_savefig = plt.savefig
+def _savefig_svg(fname, *args, **kwargs):
+    # The caller's fname is deliberately ignored: always save as SVG at a
+    # stable path for the artifact system.
+    out = Path("latency.svg")
+    kwargs["format"] = "svg"
+    # Ensure everything we care about has ids before export
+    _tag_current_figure()
+    res = _orig_savefig(out, *args, **kwargs)
+    # Add helpful CSS classes on top of ids
+    _postprocess_svg_add_classes(out)
+    print(f"✓ Combined visualization saved as {out}")
+    return res
+
+plt.savefig = _savefig_svg  # apply patch
+
+# Capture close calls in case kbt.viz() closes figures before we re-save
+_orig_close = plt.close
+_last_closed = {"fig": None}
+def _capture_close(arg=None):
+    # Remember the figure being closed so it can be recovered if needed
+    if hasattr(arg, "savefig"):  # duck-typed check: looks like a Figure
+        _last_closed["fig"] = arg
+    else:
+        _last_closed["fig"] = plt.gcf()
+    return _orig_close(arg)
+plt.close = _capture_close
-# Discover the upstream artifact directories from environment variables
+# --- Locate benchmark artifacts --------------------------------------------------
cache_dirs = {
    "Flash (PyTorch SDPA)": os.environ.get('UVNOTE_FILE_FLASH_ATTENTION_BENCHMARK'),
    "MemEff (PyTorch SDPA)": os.environ.get('UVNOTE_FILE_MEM_EFFICIENT_ATTENTION_BENCHMARK'),
@@ -3868,8 +5611,6 @@ Cell: combine | 36.17s
print(f"{name:30s}: {cache_dir}")
print()
-# Collect all JSONL paths
-all_paths = []
file_mapping = {
    "Flash (PyTorch SDPA)": "attn.jsonl",
    "MemEff (PyTorch SDPA)": "attn.jsonl",
@@ -3882,10 +5623,10 @@ Cell: combine | 36.17s
"HF Kernels Flash Attn3": "attn.jsonl",
}
+all_paths = []
for name, cache_dir in cache_dirs.items():
    if cache_dir:
-        jsonl_file = file_mapping[name]
-        path = Path(cache_dir) / jsonl_file
+        path = Path(cache_dir) / file_mapping[name]
        if path.exists() and path.stat().st_size > 0:
            all_paths.append(str(path))
            print(f"✓ Found {name}: {path}")
@@ -3893,30 +5634,40 @@ Cell: combine | 36.17s
print(f"⊘ Empty/Missing {name}: {path}")
else:
print(f"✗ No cache dir for {name}")
-
print()
if not all_paths:
    print("ERROR: No benchmark data files found!")
+    # restore patched functions before exiting
+    plt.savefig = _orig_savefig
+    plt.close = _orig_close
    sys.exit(1)
-# Generate combined summary
-print("COMBINED BENCHMARK SUMMARY")
-print()
-
+# --- Summary + Visualization -----------------------------------------------------
+print("COMBINED BENCHMARK SUMMARY\n")
kbt.summarize(all_paths)
-
-print()
-print("GENERATING COMBINED VISUALIZATION")
-print()
+print("\nGENERATING COMBINED VISUALIZATION\n")
try:
+    # If kbt.viz saves internally, our patched savefig ensures SVG gets written,
+    # and it will carry ids/classes for CSS styling.
    kbt.viz(all_paths)
-    print("✓ Combined visualization saved as latency.png")
+    # Safety net: save again via the patched savefig, which tags the figure
+    # and always writes latency.svg, even if kbt.viz saved already.
+    plt.savefig("latency.svg")
+    print("✓ SVG visualization ready: latency.svg")
except ImportError as e:
    print(f"✗ Visualization requires matplotlib: {e}")
except Exception as e:
    print(f"✗ Visualization failed: {e}")
+finally:
+    # Clean up patches to avoid side effects in later cells
+    plt.savefig = _orig_savefig
+    plt.close = _orig_close
print()
print("ANALYSIS COMPLETE")
@@ -3924,17 +5675,72 @@ Cell: combine | 36.17s
print(f"\nImplementations included:")
for name, cache_dir in cache_dirs.items():
    if cache_dir:
-        jsonl_file = file_mapping[name]
-        path = Path(cache_dir) / jsonl_file
+        path = Path(cache_dir) / file_mapping[name]
        if path.exists() and path.stat().st_size > 0:
            print(f" ✓ {name}")
+
+# Collect all benchmark data and export to CSV
+all_data = {}
+for name, cache_dir in cache_dirs.items():
+    if cache_dir:
+        path = Path(cache_dir) / file_mapping[name]
+        if path.exists() and path.stat().st_size > 0:
+            with open(path, 'r') as f:
+                # skip blank lines so a trailing newline can't break json.loads
+                records = [json.loads(line) for line in f if line.strip()]
+            all_data[name] = records
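+# Each JSONL record is expected to carry "impl", "peak_bytes", and the nested
+# "wl" (workload), "lat_ms" (latency stats), and "tags" dicts read below.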
+
+# Export to CSV
+csv_path = Path("latency.csv")
+with open(csv_path, 'w', newline='') as csvfile:
+    writer = csv.writer(csvfile)
+
+    # Write header
+    header = ["Implementation", "Impl ID", "Workload", "Batch", "Seq Length", "Heads", "Head Dim", "Dtype",
+              "Mean (ms)", "P10 (ms)", "P50 (ms)", "P90 (ms)", "Reps",
+              # "Compile (ms)",
+              "Peak Mem (MB)", "Backend", "Family"]
+    writer.writerow(header)
+
+    # Write data rows
+    for impl_name, records in all_data.items():
+        for record in records:
+            wl = record.get('wl', {})
+            lat = record.get('lat_ms', {})
+            tags = record.get('tags', {})
+
+            row = [
+                impl_name,
+                record.get('impl', ''),
+                wl.get('name', ''),
+                wl.get('batch', ''),
+                wl.get('seq_len', ''),
+                wl.get('heads', ''),
+                wl.get('head_dim', ''),
+                wl.get('dtype', ''),
+                lat.get('mean', ''),
+                lat.get('p10', ''),
+                lat.get('p50', ''),
+                lat.get('p90', ''),
+                lat.get('reps', ''),
+                # record.get('compile_ms', ''),
+                round(record.get('peak_bytes', 0) / 1024 / 1024, 2) if record.get('peak_bytes') else '',
+                tags.get('backend', ''),
+                tags.get('family', ''),
+            ]
+            writer.writerow(row)
+
+print(f"✓ CSV export complete: {csv_path}")
+print(f"Total implementations: {len(all_data)}")
+print(f"Total records: {sum(len(records) for records in all_data.values())}")
Artifacts:
-latency.png
+latency.svg
+latency.csv
+
+
| Implementation | Impl ID | Workload | Batch | Seq Length | Heads | Head Dim | Dtype | Mean (ms) | P10 (ms) | P50 (ms) | P90 (ms) | Reps | Peak Mem (MB) | Backend | Family |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| Flash (PyTorch SDPA) | torch_flash_ma | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.48577280044555665 | 0.47836801409721375 | 0.4803520143032074 | 0.4827199876308441 | 5 | 83.38 | FLASH | torch-sdpa |
| Flash (PyTorch SDPA) | torch_flash_ma | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.5229184031486511 | 0.521727979183197 | 0.5228800177574158 | 0.5234559774398804 | 5 | 90.62 | FLASH | torch-sdpa |
| Flash (PyTorch SDPA) | torch_flash_ma | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.6515967845916748 | 0.6503999829292297 | 0.650879979133606 | 0.6513599753379822 | 5 | 95.06 | FLASH | torch-sdpa |
| Flash (PyTorch SDPA) | torch_flash_ma | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.6807615995407105 | 0.6797440052032471 | 0.6808639764785767 | 0.6815680265426636 | 5 | 99.88 | FLASH | torch-sdpa |
| Flash (PyTorch SDPA) | torch_flash_ma | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.711027193069458 | 0.7058879733085632 | 0.7121919989585876 | 0.7131519913673401 | 5 | 103.81 | FLASH | torch-sdpa |
| Flash (PyTorch SDPA) | torch_flash_ma | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.7391423940658569 | 0.7369279861450195 | 0.7383999824523926 | 0.7408959865570068 | 5 | 109.12 | FLASH | torch-sdpa |
| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.5875647902488709 | 0.5863680243492126 | 0.5874559879302979 | 0.5876479744911194 | 5 | 83.38 | EFFICIENT | torch-sdpa |
| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.653657603263855 | 0.6485440135002136 | 0.6537600159645081 | 0.656544029712677 | 5 | 90.62 | EFFICIENT | torch-sdpa |
| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.7784512042999268 | 0.774944007396698 | 0.778656005859375 | 0.7801600098609924 | 5 | 95.94 | EFFICIENT | torch-sdpa |
| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.7922943949699401 | 0.791263997554779 | 0.7924799919128418 | 0.7927039861679077 | 5 | 100.0 | EFFICIENT | torch-sdpa |
| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.848089587688446 | 0.8444799780845642 | 0.8470079898834229 | 0.8499199748039246 | 5 | 103.81 | EFFICIENT | torch-sdpa |
| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.9523776054382325 | 0.95004802942276 | 0.9519039988517761 | 0.9541119933128357 | 5 | 109.12 | EFFICIENT | torch-sdpa |
| xFormers | xformers_meff | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.45066879987716674 | 0.4474239945411682 | 0.44921600818634033 | 0.45241600275039673 | 5 | 83.38 | memory_efficient | xformers |
| xFormers | xformers_meff | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.47004159688949587 | 0.4652479887008667 | 0.4705919921398163 | 0.4716799855232239 | 5 | 90.62 | memory_efficient | xformers |
| xFormers | xformers_meff | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.6022783994674683 | 0.5987840294837952 | 0.6021760106086731 | 0.6045759916305542 | 5 | 95.06 | memory_efficient | xformers |
| xFormers | xformers_meff | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.6013055920600892 | 0.6000319719314575 | 0.600383996963501 | 0.6016640067100525 | 5 | 99.88 | memory_efficient | xformers |
| xFormers | xformers_meff | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.6408192038536071 | 0.639136016368866 | 0.6404479742050171 | 0.6416320204734802 | 5 | 103.81 | memory_efficient | xformers |
| xFormers | xformers_meff | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.6466111898422241 | 0.6447359919548035 | 0.6462399959564209 | 0.6483839750289917 | 5 | 109.12 | memory_efficient | xformers |
| Compiled (default) | torch_flash_compiled_default | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.527347207069397 | 0.5194560289382935 | 0.5272960066795349 | 0.5312960147857666 | 5 | 83.38 | FLASH | torch-sdpa |
| Compiled (default) | torch_flash_compiled_default | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.5586367964744567 | 0.5560640096664429 | 0.5571519732475281 | 0.5611839890480042 | 5 | 90.62 | FLASH | torch-sdpa |
| Compiled (default) | torch_flash_compiled_default | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.6860736012458801 | 0.6841920018196106 | 0.6860160231590271 | 0.6869760155677795 | 5 | 95.25 | FLASH | torch-sdpa |
| Compiled (default) | torch_flash_compiled_default | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.7167360067367554 | 0.7152000069618225 | 0.7161920070648193 | 0.7164160013198853 | 5 | 99.88 | FLASH | torch-sdpa |
| Compiled (default) | torch_flash_compiled_default | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.7423295855522156 | 0.7400959730148315 | 0.742143988609314 | 0.7431039810180664 | 5 | 103.81 | FLASH | torch-sdpa |
| Compiled (default) | torch_flash_compiled_default | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.7743871927261352 | 0.7718080282211304 | 0.7745919823646545 | 0.7748159766197205 | 5 | 109.12 | FLASH | torch-sdpa |
| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.6489088058471679 | 0.6148160099983215 | 0.6296960115432739 | 0.6522240042686462 | 5 | 67.5 | FLASH | torch-sdpa |
| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.700761592388153 | 0.6615359783172607 | 0.6821119785308838 | 0.7128959894180298 | 5 | 75.0 | FLASH | torch-sdpa |
| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.834444797039032 | 0.7967039942741394 | 0.8164799809455872 | 0.8463680148124695 | 5 | 80.38 | FLASH | torch-sdpa |
| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.8709375977516174 | 0.8432319760322571 | 0.8498560190200806 | 0.8750079870223999 | 5 | 82.5 | FLASH | torch-sdpa |
| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.9069631934165955 | 0.8775359988212585 | 0.9030719995498657 | 0.903872013092041 | 5 | 86.25 | FLASH | torch-sdpa |
| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.9371584057807922 | 0.9145920276641846 | 0.9164159893989563 | 0.9357439875602722 | 5 | 90.0 | FLASH | torch-sdpa |
| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.34446719884872434 | 0.3438720107078552 | 0.3445119857788086 | 0.34457600116729736 | 5 | 83.38 | flash-attn | hf-kernels |
| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.37571839094161985 | 0.37404799461364746 | 0.3763839900493622 | 0.3766399919986725 | 5 | 90.62 | flash-attn | hf-kernels |
| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.4945920050144196 | 0.4925439953804016 | 0.493120014667511 | 0.4938240051269531 | 5 | 95.06 | flash-attn | hf-kernels |
| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.5139647841453552 | 0.5123199820518494 | 0.5142719745635986 | 0.5147839784622192 | 5 | 99.88 | flash-attn | hf-kernels |
| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.5353855967521668 | 0.5339199900627136 | 0.5350080132484436 | 0.5352320075035095 | 5 | 103.81 | flash-attn | hf-kernels |
| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.5548800110816956 | 0.5538560152053833 | 0.5548800230026245 | 0.5553280115127563 | 5 | 109.12 | flash-attn | hf-kernels |
| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.3617343962192535 | 0.36102399230003357 | 0.3616960048675537 | 0.36211198568344116 | 5 | 83.38 | flash-attn3 | hf-kernels |
| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.3907967984676361 | 0.3885439932346344 | 0.39056000113487244 | 0.3906239867210388 | 5 | 90.62 | flash-attn3 | hf-kernels |
| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.5228991985321045 | 0.521344006061554 | 0.5230720043182373 | 0.5232319831848145 | 5 | 95.06 | flash-attn3 | hf-kernels |
| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.5254656076431274 | 0.523904025554657 | 0.5249919891357422 | 0.526528000831604 | 5 | 99.88 | flash-attn3 | hf-kernels |
| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.5646592020988465 | 0.5627840161323547 | 0.565343976020813 | 0.565343976020813 | 5 | 103.81 | flash-attn3 | hf-kernels |
| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.5698879957199097 | 0.567359983921051 | 0.5696640014648438 | 0.5698559880256653 | 5 | 109.12 | flash-attn3 | hf-kernels |