# /// script
# requires-python = ">=3.10"
-# dependencies = [
-# "numpy",
-# "torch",
-# "kernels-benchmark-tools",
-# "matplotlib",
-# ]
-#
+# dependencies = ["torch", "kernels-benchmark-tools", "matplotlib"]
# [tool.uv.sources]
-# kernels-benchmark-tools = { git = "https://github.com/drbh/kernels-benchmark-tools.git", branch = "main" }
+# kernels-benchmark-tools = { path = "../../../../../tools", editable = true }
# ///
-import os
-import sys
-from pathlib import Path
-import json
-import torch # noqa: F401 # imported because upstream may expect torch to be importable
-import kernels_benchmark_tools as kbt
-
-# --- Matplotlib setup and helpers ------------------------------------------------
-import matplotlib as mpl
-import matplotlib.pyplot as plt
-import csv
-
-
-# Keep text as text (not paths) so CSS can style fonts, size, etc.
-mpl.rcParams["svg.fonttype"] = "none"
-# Make ids deterministic across builds
-mpl.rcParams["svg.hashsalt"] = "latency-benchmark-combined"
-# Avoid auto-closed figures interfering with our tagging
-mpl.rcParams["figure.autolayout"] = True
-# Make background transparent
-mpl.rcParams["figure.facecolor"] = "none"
-mpl.rcParams["axes.facecolor"] = "none"
-mpl.rcParams["savefig.facecolor"] = "none"
-mpl.rcParams["savefig.edgecolor"] = "none"
-
-def _slugify(s: str) -> str:
- s = (s or "").strip().lower()
- keep = []
- for ch in s:
- if ch.isalnum():
- keep.append(ch)
- elif ch in (" ", "-", "_", "/", ".", ":"):
- keep.append("-")
- else:
- keep.append("")
- out = "".join(keep)
- while "--" in out:
- out = out.replace("--", "-")
- return out.strip("-") or "unnamed"
-
-def _tag_current_figure(default_series_prefix="series"):
- """Attach SVG ids (gid) to key artists so they can be targeted from CSS."""
- fig = plt.gcf()
- if fig is None:
- return
-
- # Tag the figure itself
- fig.set_gid("figure--latency")
-
- for ax_idx, ax in enumerate(fig.get_axes(), start=1):
- ax.set_gid(f"axes--{ax_idx}")
-
- # Axis labels & title
- if ax.get_title():
- for t in ax.texts:
- if t.get_text() == ax.get_title():
- t.set_gid("title--main")
- if ax.xaxis and ax.xaxis.get_label():
- ax.xaxis.label.set_gid("label--x")
- if ax.yaxis and ax.yaxis.get_label():
- ax.yaxis.label.set_gid("label--y")
-
- # Gridlines
- for i, gl in enumerate(ax.get_xgridlines(), start=1):
- gl.set_gid(f"grid-x--{i}")
- for i, gl in enumerate(ax.get_ygridlines(), start=1):
- gl.set_gid(f"grid-y--{i}")
-
- # Legend block & entries
- leg = ax.get_legend()
- if leg is not None:
- leg.set_gid("legend")
- for i, txt in enumerate(leg.get_texts(), start=1):
- label_slug = _slugify(txt.get_text())
- txt.set_gid(f"legend-label--{label_slug or i}")
-
- # Series (lines, patches)
- # Lines
- line_seen = {}
- for ln in getattr(ax, "lines", []):
- raw_label = ln.get_label() or ""
- # Matplotlib uses labels beginning with "_" for non-legendable items
- label = raw_label if not raw_label.startswith("_") else f"{default_series_prefix}"
- slug = _slugify(label)
- line_seen[slug] = line_seen.get(slug, 0) + 1
- suffix = "" if line_seen[slug] == 1 else f"-{line_seen[slug]}"
- ln.set_gid(f"series--{slug}{suffix}")
-
- # Patches (bars, areas)
- patch_seen = {}
- for pt in getattr(ax, "patches", []):
- label = getattr(pt, "get_label", lambda: "")() or f"{default_series_prefix}"
- if isinstance(label, str) and label.startswith("_"):
- label = default_series_prefix
- slug = _slugify(label)
- patch_seen[slug] = patch_seen.get(slug, 0) + 1
- suffix = "" if patch_seen[slug] == 1 else f"-{patch_seen[slug]}"
- pt.set_gid(f"series--{slug}{suffix}")
-
-def _postprocess_svg_add_classes(svg_path: Path):
- """Add convenient CSS classes alongside ids (e.g., class='series grid grid-x')."""
- try:
- import xml.etree.ElementTree as ET
- ET.register_namespace("", "http://www.w3.org/2000/svg")
- tree = ET.parse(svg_path)
- root = tree.getroot()
- for el in root.iter():
- el_id = el.attrib.get("id", "")
- if not el_id:
- continue
- cls = []
- if el_id.startswith("figure--"):
- cls.append("figure")
- elif el_id.startswith("axes--"):
- cls.append("axes")
- elif el_id.startswith("grid-x--"):
- cls += ["grid", "grid-x"]
- elif el_id.startswith("grid-y--"):
- cls += ["grid", "grid-y"]
- elif el_id.startswith("legend"):
- cls.append("legend")
- elif el_id.startswith("label--x"):
- cls.append("xlabel")
- elif el_id.startswith("label--y"):
- cls.append("ylabel")
- elif el_id.startswith("title--"):
- cls.append("title")
- elif el_id.startswith("series--"):
- cls.append("series")
- if cls:
- # Preserve any existing class (unlikely from Matplotlib)
- existing = el.attrib.get("class", "")
- el.set("class", (existing + " " + " ".join(cls)).strip())
- tree.write(svg_path, encoding="utf-8", xml_declaration=True)
- except Exception as e:
- print(f"✗ SVG postprocess (classes) skipped: {e}")
-
-# Monkey-patch savefig to force SVG & ensure tagging occurs even if kbt.viz saves internally.
-_orig_savefig = plt.savefig
-def _savefig_svg(fname, *args, **kwargs):
- # Always save as SVG at a stable path for the artifact system
- out = Path("latency.svg")
- kwargs["format"] = "svg"
- # Ensure everything we care about has ids before export
- _tag_current_figure()
- res = _orig_savefig(out, *args, **kwargs)
- # Add helpful CSS classes on top of ids
- _postprocess_svg_add_classes(out)
- print(f"✓ Combined visualization saved as {out}")
- return res
-
-plt.savefig = _savefig_svg # apply patch
-
-# Capture close calls in case kbt.viz() closes figures before we re-save
-_orig_close = plt.close
-_last_closed = {"fig": None}
-def _capture_close(arg=None):
- try:
- if hasattr(arg, "savefig"): # looks like a Figure
- _last_closed["fig"] = arg
- else:
- _last_closed["fig"] = plt.gcf()
- finally:
- return _orig_close(arg)
-plt.close = _capture_close
-
-# --- Locate benchmark artifacts --------------------------------------------------
-cache_dirs = {
- "Flash (PyTorch SDPA)": os.environ.get('UVNOTE_FILE_FLASH_ATTENTION_BENCHMARK'),
- "MemEff (PyTorch SDPA)": os.environ.get('UVNOTE_FILE_MEM_EFFICIENT_ATTENTION_BENCHMARK'),
- "Flash Attn 2": os.environ.get('UVNOTE_FILE_FLASH_ATTN2_BENCHMARK'),
- "xFormers": os.environ.get('UVNOTE_FILE_XFORMERS_BENCHMARK'),
- "SageAttention": os.environ.get('UVNOTE_FILE_SAGE_ATTENTION_BENCHMARK'),
- "Compiled (default)": os.environ.get('UVNOTE_FILE_COMPILED_VARIANTS_BENCHMARK_DEFAULT'),
- "Compiled (max-autotune)": os.environ.get('UVNOTE_FILE_COMPILED_VARIANTS_BENCHMARK_MAX_AUTOTUNE'),
- "HF Kernels Flash Attn": os.environ.get('UVNOTE_FILE_HF_KERNELS_FLASH_ATTN_BENCHMARK'),
- "HF Kernels Flash Attn3": os.environ.get('UVNOTE_FILE_HF_KERNELS_FLASH_ATTN3_BENCHMARK'),
+# Note: the flash-attention implementations write different output files. Most
+# write attn.jsonl; the compiled variants write attn_default.jsonl and attn_max_autotune.jsonl.
+cache_env_map = {
+ "Flash (PyTorch SDPA)": "UVNOTE_FILE_FLASH_ATTENTION_BENCHMARK",
+ "MemEff (PyTorch SDPA)": "UVNOTE_FILE_MEM_EFFICIENT_ATTENTION_BENCHMARK",
+ "xFormers": "UVNOTE_FILE_XFORMERS_BENCHMARK",
+ "Compiled (default)": "UVNOTE_FILE_COMPILED_VARIANTS_BENCHMARK_DEFAULT",
+ "Compiled (max-autotune)": "UVNOTE_FILE_COMPILED_VARIANTS_BENCHMARK_MAX_AUTOTUNE",
+ "HF Kernels Flash Attn": "UVNOTE_FILE_HF_KERNELS_FLASH_ATTN_BENCHMARK",
+ "HF Kernels Flash Attn3": "UVNOTE_FILE_HF_KERNELS_FLASH_ATTN3_BENCHMARK",
}
-print("LOADING BENCHMARK DATA")
-for name, cache_dir in cache_dirs.items():
- print(f"{name:30s}: {cache_dir}")
-print()
+# Only the compiled variants need a custom file name; everything else defaults to attn.jsonl.
+import os
+from pathlib import Path
file_mapping = {
- "Flash (PyTorch SDPA)": "attn.jsonl",
- "MemEff (PyTorch SDPA)": "attn.jsonl",
- "Flash Attn 2": "attn.jsonl",
- "xFormers": "attn.jsonl",
- "SageAttention": "attn.jsonl",
"Compiled (default)": "attn_default.jsonl",
"Compiled (max-autotune)": "attn_max_autotune.jsonl",
- "HF Kernels Flash Attn": "attn.jsonl",
- "HF Kernels Flash Attn3": "attn.jsonl",
}
+# Collect paths with custom file names for compiled variants
all_paths = []
-for name, cache_dir in cache_dirs.items():
+for name, env_var in cache_env_map.items():
+ cache_dir = os.environ.get(env_var)
if cache_dir:
- path = Path(cache_dir) / file_mapping[name]
+ filename = file_mapping.get(name, "attn.jsonl")
+ path = Path(cache_dir) / filename
if path.exists() and path.stat().st_size > 0:
all_paths.append(str(path))
print(f"✓ Found {name}: {path}")
else:
- print(f"⊘ Empty/Missing {name}: {path}")
+ print(f"⊘ Skipped {name}: {path}")
else:
- print(f"✗ No cache dir for {name}")
-print()
+ print(f"✗ Missing {name}")
if not all_paths:
print("ERROR: No benchmark data files found!")
- # restore patched functions before exiting
- plt.savefig = _orig_savefig
- plt.close = _orig_close
+ import sys
sys.exit(1)
-# --- Summary + Visualization -----------------------------------------------------
-print("COMBINED BENCHMARK SUMMARY\n")
-kbt.summarize(all_paths)
-print("\nGENERATING COMBINED VISUALIZATION\n")
+# Use the shared visualization helpers from kernels-benchmark-tools
+from kernels_benchmark_tools.core import tools
+from kernels_benchmark_tools.core.visuals import setup_svg_matplotlib, create_svg_with_tagging
+import matplotlib.pyplot as plt  # imported before the try so the finally block can always restore the patches
+
+setup_svg_matplotlib()
+_orig_savefig, _orig_close = create_svg_with_tagging("latency.svg", "flash-attention")
try:
- # If kbt.viz saves internally, our patched savefig ensures SVG gets written,
- # and it will carry ids/classes for CSS styling.
- kbt.viz(all_paths)
- # Safety net: if kbt.viz didn't save, save now.
- # if not Path("latency.svg").exists():
- # _tag_current_figure()
- # plt.savefig("latency.svg")
-
- plt.savefig("latency.svg") # ensure saved with tagging
-
- print("✓ SVG visualization ready: latency.svg!")
-except ImportError as e:
- print(f"✗ Visualization requires matplotlib: {e}")
-except Exception as e:
- print(f"✗ Visualization failed: {e}")
+ print("\nCOMBINED BENCHMARK SUMMARY\n")
+ tools.summarize(all_paths)
+
+ print("\nGENERATING COMBINED VISUALIZATION\n")
+ tools.viz(all_paths)
+
+ import matplotlib.pyplot as plt
+ plt.savefig("latency.svg")
+ print("✓ SVG visualization ready!")
finally:
- # Clean up patches to avoid side effects in later cells
plt.savefig = _orig_savefig
plt.close = _orig_close
-
-print()
-print("ANALYSIS COMPLETE")
-print(f"Total implementations analyzed: {len(all_paths)}")
-print(f"\nImplementations included:")
-for name, cache_dir in cache_dirs.items():
- if cache_dir:
- path = Path(cache_dir) / file_mapping[name]
- if path.exists() and path.stat().st_size > 0:
- print(f" ✓ {name}")
-
-
-
-# Collect all benchmark data and export to CSV
-all_data = {}
-for name, cache_dir in cache_dirs.items():
- if cache_dir:
- path = Path(cache_dir) / file_mapping[name]
- if path.exists() and path.stat().st_size > 0:
- with open(path, 'r') as f:
- records = [json.loads(line) for line in f]
- all_data[name] = records
-
-# Export to CSV
-csv_path = Path("latency.csv")
-with open(csv_path, 'w', newline='') as csvfile:
- writer = csv.writer(csvfile)
-
- # Write header
- header = ["Implementation", "Impl ID", "Workload", "Batch", "Seq Length", "Heads", "Head Dim", "Dtype",
- "Mean (ms)", "P10 (ms)", "P50 (ms)", "P90 (ms)", "Reps",
- # "Compile (ms)",
- "Peak Mem (MB)", "Backend", "Family"]
- writer.writerow(header)
-
- # Write data rows
- for impl_name, records in all_data.items():
- for record in records:
- wl = record.get('wl', {})
- lat = record.get('lat_ms', {})
- tags = record.get('tags', {})
-
- row = [
- impl_name,
- record.get('impl', ''),
- wl.get('name', ''),
- wl.get('batch', ''),
- wl.get('seq_len', ''),
- wl.get('heads', ''),
- wl.get('head_dim', ''),
- wl.get('dtype', ''),
- lat.get('mean', ''),
- lat.get('p10', ''),
- lat.get('p50', ''),
- lat.get('p90', ''),
- lat.get('reps', ''),
- # record.get('compile_ms', ''),
- round(record.get('peak_bytes', 0) / 1024 / 1024, 2) if record.get('peak_bytes') else '',
- tags.get('backend', ''),
- tags.get('family', ''),
- ]
- writer.writerow(row)
-
-print(f"✓ CSV export complete: {csv_path}")
-print(f"Total implementations: {len(all_data)}")
-print(f"Total records: {sum(len(records) for records in all_data.values())}")
✓ Found Flash (PyTorch SDPA): /__w/kernels-benchmarks/kernels-benchmarks/benches/flash_attn/impls/.uvnote/cache/669be66a140da2b4e0da461648c43c1d5d868bfecd1d86ce3c5cefe7bf6b5095/attn.jsonl
+✓ Found MemEff (PyTorch SDPA): /__w/kernels-benchmarks/kernels-benchmarks/benches/flash_attn/impls/.uvnote/cache/d50b1832883940bf8e1b301f9e544d51e67d3edfec86eea4427285c75792eca1/attn.jsonl
+✓ Found xFormers: /__w/kernels-benchmarks/kernels-benchmarks/benches/flash_attn/impls/.uvnote/cache/7663611410e2106f3875f69749feba575364abf561b07527376e06da9ccbca78/attn.jsonl
+✓ Found Compiled (default): /__w/kernels-benchmarks/kernels-benchmarks/benches/flash_attn/impls/.uvnote/cache/7a1d1c41a3d743b4b34d02393e8397ba23383940890d8fd1f4f46e296d62938e/attn_default.jsonl
+✓ Found Compiled (max-autotune): /__w/kernels-benchmarks/kernels-benchmarks/benches/flash_attn/impls/.uvnote/cache/314fe0e8997361ffe9c6a2252cce35c8b2184007bb328de7f71e529e42a46d73/attn_max_autotune.jsonl
+✓ Found HF Kernels Flash Attn: /__w/kernels-benchmarks/kernels-benchmarks/benches/flash_attn/impls/.uvnote/cache/60f199ad338be11b49f2e8e781c982a5f107106c0c1b7f43ced3be59820560c9/attn.jsonl
+✓ Found HF Kernels Flash Attn3: /__w/kernels-benchmarks/kernels-benchmarks/benches/flash_attn/impls/.uvnote/cache/a9419f7d27246259f950b2b3abce9149f1cf0c2d35d1bbc5af7cc75ae37baa6d/attn.jsonl

COMBINED BENCHMARK SUMMARY

impl                               wl         p50(ms)  ok
-hf_kernels_flash_attn              flux_L128  0.25     True
-hf_kernels_flash_attn              flux_L256  0.32     True
-hf_kernels_flash_attn              flux_L320  0.34     True
-hf_kernels_flash_attn              flux_L384  0.35     True
-hf_kernels_flash_attn              flux_L448  0.38     True
-hf_kernels_flash_attn              flux_L512  0.42     True
-hf_kernels_flash_attn3             flux_L128  0.28     True
-hf_kernels_flash_attn3             flux_L256  0.34     True
-hf_kernels_flash_attn3             flux_L320  0.36     True
-hf_kernels_flash_attn3             flux_L384  0.37     True
-hf_kernels_flash_attn3             flux_L448  0.40     True
-hf_kernels_flash_attn3             flux_L512  0.43     True
-torch_flash_compiled_default       flux_L128  0.36     True
-torch_flash_compiled_default       flux_L256  0.50     True
-torch_flash_compiled_default       flux_L320  0.54     True
-torch_flash_compiled_default       flux_L384  0.59     True
-torch_flash_compiled_default       flux_L448  0.61     True
-torch_flash_compiled_default       flux_L512  0.64     True
-torch_flash_compiled_max_autotune  flux_L128  0.38     True
-torch_flash_compiled_max_autotune  flux_L256  0.55     True
-torch_flash_compiled_max_autotune  flux_L320  0.61     True
-torch_flash_compiled_max_autotune  flux_L384  0.66     True
-torch_flash_compiled_max_autotune  flux_L448  0.70     True
-torch_flash_compiled_max_autotune  flux_L512  0.76     True
-torch_flash_ma                     flux_L128  0.41     True
-torch_flash_ma                     flux_L256  0.52     True
-torch_flash_ma                     flux_L320  0.55     True
-torch_flash_ma                     flux_L384  0.59     True
-torch_flash_ma                     flux_L448  0.64     True
-torch_flash_ma                     flux_L512  0.68     True
-torch_mem_eff                      flux_L128  0.48     True
-torch_mem_eff                      flux_L256  0.63     True
-torch_mem_eff                      flux_L320  0.70     True
-torch_mem_eff                      flux_L384  0.83     True
-torch_mem_eff                      flux_L448  0.95     True
-torch_mem_eff                      flux_L512  1.00     True
-xformers_meff                      flux_L128  0.35     True
-xformers_meff                      flux_L256  0.41     True
-xformers_meff                      flux_L320  0.43     True
-xformers_meff                      flux_L384  0.44     True
-xformers_meff                      flux_L448  0.48     True
-xformers_meff                      flux_L512  0.50     True
+hf_kernels_flash_attn              flux_L128  0.12     True
+hf_kernels_flash_attn              flux_L256  0.14     True
+hf_kernels_flash_attn              flux_L320  0.14     True
+hf_kernels_flash_attn              flux_L384  0.15     True
+hf_kernels_flash_attn              flux_L448  0.20     True
+hf_kernels_flash_attn              flux_L512  0.20     True
+hf_kernels_flash_attn3             flux_L128  0.13     True
+hf_kernels_flash_attn3             flux_L256  0.15     True
+hf_kernels_flash_attn3             flux_L320  0.16     True
+hf_kernels_flash_attn3             flux_L384  0.16     True
+hf_kernels_flash_attn3             flux_L448  0.21     True
+hf_kernels_flash_attn3             flux_L512  0.21     True
+torch_flash_compiled_default       flux_L128  0.20     True
+torch_flash_compiled_default       flux_L256  0.23     True
+torch_flash_compiled_default       flux_L320  0.24     True
+torch_flash_compiled_default       flux_L384  0.24     True
+torch_flash_compiled_default       flux_L448  FAIL     False
+    Error: recompile_limit reached with one_graph=True. Excessive recompilations can degrade performance due to the compilation overhead of each recompilation. To monitor recompilations, enable TORCH_LOGS=recompiles. If recompilations are expected, consider increasing torch._dynamo.config.cache_size_limit to an appropriate value.
+torch_flash_compiled_default       flux_L512  FAIL     False
+    Error: recompile_limit reached with one_graph=True. Excessive recompilations can degrade performance due to the compilation overhead of each recompilation. To monitor recompilations, enable TORCH_LOGS=recompiles. If recompilations are expected, consider increasing torch._dynamo.config.cache_size_limit to an appropriate value.
+torch_flash_compiled_max_autotune  flux_L128  0.19     True
+torch_flash_compiled_max_autotune  flux_L256  0.20     True
+torch_flash_compiled_max_autotune  flux_L320  0.21     True
+torch_flash_compiled_max_autotune  flux_L384  0.21     True
+torch_flash_compiled_max_autotune  flux_L448  FAIL     False
+    Error: recompile_limit reached with one_graph=True. Excessive recompilations can degrade performance due to the compilation overhead of each recompilation. To monitor recompilations, enable TORCH_LOGS=recompiles. If recompilations are expected, consider increasing torch._dynamo.config.cache_size_limit to an appropriate value.
+torch_flash_compiled_max_autotune  flux_L512  FAIL     False
+    Error: recompile_limit reached with one_graph=True. Excessive recompilations can degrade performance due to the compilation overhead of each recompilation. To monitor recompilations, enable TORCH_LOGS=recompiles. If recompilations are expected, consider increasing torch._dynamo.config.cache_size_limit to an appropriate value.
+torch_flash_ma                     flux_L128  0.18     True
+torch_flash_ma                     flux_L256  0.21     True
+torch_flash_ma                     flux_L320  0.22     True
+torch_flash_ma                     flux_L384  0.22     True
+torch_flash_ma                     flux_L448  0.27     True
+torch_flash_ma                     flux_L512  0.28     True
+torch_mem_eff                      flux_L128  0.23     True
+torch_mem_eff                      flux_L256  0.26     True
+torch_mem_eff                      flux_L320  0.28     True
+torch_mem_eff                      flux_L384  0.28     True
+torch_mem_eff                      flux_L448  0.30     True
+torch_mem_eff                      flux_L512  0.34     True
+xformers_meff                      flux_L128  0.20     True
+xformers_meff                      flux_L256  0.21     True
+xformers_meff                      flux_L320  0.22     True
+xformers_meff                      flux_L384  0.22     True
+xformers_meff                      flux_L448  0.28     True
+xformers_meff                      flux_L512  0.27     True

GENERATING COMBINED VISUALIZATION

Loaded 42 records
-✓ Combined visualization saved as latency.svg
+✓ Visualization saved as latency.svg
Saved latency.png
-✓ Combined visualization saved as latency.svg
-✓ SVG visualization ready: latency.svg!
-
-ANALYSIS COMPLETE
-Total implementations analyzed: 7
-
-Implementations included:
-  ✓ Flash (PyTorch SDPA)
-  ✓ MemEff (PyTorch SDPA)
-  ✓ xFormers
-  ✓ Compiled (default)
-  ✓ Compiled (max-autotune)
-  ✓ HF Kernels Flash Attn
-  ✓ HF Kernels Flash Attn3
-✓ CSV export complete: latency.csv
-Total implementations: 7
-Total records: 42
-
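The four FAIL rows in the new output are torch.compile recompile-limit trips rather than kernel errors: presumably each new sequence length in the sweep triggers another Dynamo recompile until the budget is exhausted at flux_L448. The error text names the knob itself; a hedged sketch of that workaround (64 is an arbitrary example value, and whether it rescues these two shapes is untested here):

import torch

# Raise Dynamo's recompile budget before compiling, as the error message suggests.
# Run with TORCH_LOGS=recompiles in the environment to see what triggers each recompile.
torch._dynamo.config.cache_size_limit = 64  # arbitrary example; the default is lower

compiled_sdpa = torch.compile(torch.nn.functional.scaled_dot_product_attention)

Elsewhere the new numbers are clean; at flux_L512 the spread runs from 0.20 ms (hf_kernels_flash_attn) to 0.34 ms (torch_mem_eff), roughly 1.7x.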
Artifacts:
-latency.csv
latency.svg

-| Implementation | Impl ID | Workload | Batch | Seq Length | Heads | Head Dim | Dtype | Mean (ms) | P10 (ms) | P50 (ms) | P90 (ms) | Reps | Peak Mem (MB) | Backend | Family |
-|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| Flash (PyTorch SDPA) | torch_flash_ma | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.407123202085495 | 0.40537598729133606 | 0.40755200386047363 | 0.407584011554718 | 5 | 83.38 | FLASH | torch-sdpa |
-| Flash (PyTorch SDPA) | torch_flash_ma | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.5235007882118226 | 0.5212159752845764 | 0.5232639908790588 | 0.523360013961792 | 5 | 90.62 | FLASH | torch-sdpa |
-| Flash (PyTorch SDPA) | torch_flash_ma | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.545849597454071 | 0.5418559908866882 | 0.5468159914016724 | 0.5469120144844055 | 5 | 95.06 | FLASH | torch-sdpa |
-| Flash (PyTorch SDPA) | torch_flash_ma | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.5892416119575501 | 0.5867519974708557 | 0.5888000130653381 | 0.5888000130653381 | 5 | 99.88 | FLASH | torch-sdpa |
-| Flash (PyTorch SDPA) | torch_flash_ma | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.6449280023574829 | 0.6430720090866089 | 0.6442239880561829 | 0.6450240015983582 | 5 | 103.81 | FLASH | torch-sdpa |
-| Flash (PyTorch SDPA) | torch_flash_ma | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.6823423862457275 | 0.6777600049972534 | 0.6809599995613098 | 0.6818559765815735 | 5 | 109.12 | FLASH | torch-sdpa |
-| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.48371200561523436 | 0.4821760058403015 | 0.4833280146121979 | 0.4853760004043579 | 5 | 83.38 | EFFICIENT | torch-sdpa |
-| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.6268800020217895 | 0.6246399879455566 | 0.6266880035400391 | 0.6286720037460327 | 5 | 90.62 | EFFICIENT | torch-sdpa |
-| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.699776005744934 | 0.6973440051078796 | 0.7004160284996033 | 0.7004479765892029 | 5 | 95.94 | EFFICIENT | torch-sdpa |
-| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.8333312034606933 | 0.8284159898757935 | 0.8325120210647583 | 0.8376320004463196 | 5 | 100.0 | EFFICIENT | torch-sdpa |
-| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.9533439993858337 | 0.9502720236778259 | 0.9512959718704224 | 0.9572479724884033 | 5 | 103.81 | EFFICIENT | torch-sdpa |
-| MemEff (PyTorch SDPA) | torch_mem_eff | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 1.0066367864608765 | 1.0024960041046143 | 1.0045440196990967 | 1.0097919702529907 | 5 | 109.12 | EFFICIENT | torch-sdpa |
-| xFormers | xformers_meff | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.3452928066253662 | 0.3389439880847931 | 0.3461120128631592 | 0.3461120128631592 | 5 | 83.38 | memory_efficient | xformers |
-| xFormers | xformers_meff | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.41234560012817384 | 0.40959998965263367 | 0.41280001401901245 | 0.41286399960517883 | 5 | 90.62 | memory_efficient | xformers |
-| xFormers | xformers_meff | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.4366208016872406 | 0.4310399889945984 | 0.4331519901752472 | 0.4362240135669708 | 5 | 95.06 | memory_efficient | xformers |
-| xFormers | xformers_meff | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.4450624048709869 | 0.4359680116176605 | 0.44361600279808044 | 0.447488009929657 | 5 | 99.88 | memory_efficient | xformers |
-| xFormers | xformers_meff | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.4750400006771088 | 0.4711039960384369 | 0.47513601183891296 | 0.4763199985027313 | 5 | 103.81 | memory_efficient | xformers |
-| xFormers | xformers_meff | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.5009407997131348 | 0.49663999676704407 | 0.4997119903564453 | 0.5038080215454102 | 5 | 109.12 | memory_efficient | xformers |
-| Compiled (default) | torch_flash_compiled_default | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.3856383919715881 | 0.3563520014286041 | 0.35942399501800537 | 0.3624959886074066 | 5 | 83.38 | FLASH | torch-sdpa |
-| Compiled (default) | torch_flash_compiled_default | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.4982912003993988 | 0.4926080107688904 | 0.49663999676704407 | 0.5017600059509277 | 5 | 90.62 | FLASH | torch-sdpa |
-| Compiled (default) | torch_flash_compiled_default | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.5369919896125793 | 0.5335040092468262 | 0.5366079807281494 | 0.5386239886283875 | 5 | 95.25 | FLASH | torch-sdpa |
-| Compiled (default) | torch_flash_compiled_default | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.5841408014297486 | 0.5775359869003296 | 0.5868800282478333 | 0.5877760052680969 | 5 | 99.88 | FLASH | torch-sdpa |
-| Compiled (default) | torch_flash_compiled_default | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.6184704065322876 | 0.6072319746017456 | 0.6113280057907104 | 0.6144000291824341 | 5 | 103.81 | FLASH | torch-sdpa |
-| Compiled (default) | torch_flash_compiled_default | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.6428672075271606 | 0.6399999856948853 | 0.6430720090866089 | 0.6430720090866089 | 5 | 109.12 | FLASH | torch-sdpa |
-| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.40020479559898375 | 0.3665919899940491 | 0.3768320083618164 | 0.41171199083328247 | 5 | 81.75 | FLASH | torch-sdpa |
-| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.5535807967185974 | 0.5160959959030151 | 0.5489599704742432 | 0.5631359815597534 | 5 | 92.88 | FLASH | torch-sdpa |
-| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.6143999934196472 | 0.562175989151001 | 0.6144000291824341 | 0.6318079829216003 | 5 | 95.13 | FLASH | torch-sdpa |
-| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.6754495978355408 | 0.6512640118598938 | 0.6584320068359375 | 0.6799359917640686 | 5 | 97.13 | FLASH | torch-sdpa |
-| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.7210752129554748 | 0.6973119974136353 | 0.7014080286026001 | 0.7229440212249756 | 5 | 99.0 | FLASH | torch-sdpa |
-| Compiled (max-autotune) | torch_flash_compiled_max_autotune | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.7735359907150269 | 0.7485439777374268 | 0.7557439804077148 | 0.7710719704627991 | 5 | 101.63 | FLASH | torch-sdpa |
-| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.2456959992647171 | 0.24371199309825897 | 0.24566400051116943 | 0.2457599937915802 | 5 | 83.38 | flash-attn | hf-kernels |
-| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.3215551972389221 | 0.3164159953594208 | 0.319487988948822 | 0.32051199674606323 | 5 | 90.62 | flash-attn | hf-kernels |
-| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.3384703993797302 | 0.33670398592948914 | 0.33792001008987427 | 0.33983999490737915 | 5 | 95.06 | flash-attn | hf-kernels |
-| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.3510208010673523 | 0.3481599986553192 | 0.3491840064525604 | 0.35225600004196167 | 5 | 99.88 | flash-attn | hf-kernels |
-| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.3829823970794678 | 0.38095998764038086 | 0.3829759955406189 | 0.3840000033378601 | 5 | 103.81 | flash-attn | hf-kernels |
-| HF Kernels Flash Attn | hf_kernels_flash_attn | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.4259391903877258 | 0.4227519929409027 | 0.4249599874019623 | 0.4259839951992035 | 5 | 109.12 | flash-attn | hf-kernels |
-| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L128 | 1 | 1152 | 24 | 128 | bfloat16 | 0.2755008041858673 | 0.26736000180244446 | 0.27561599016189575 | 0.27955201268196106 | 5 | 83.38 | flash-attn3 | hf-kernels |
-| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L256 | 1 | 1280 | 24 | 128 | bfloat16 | 0.3397440016269684 | 0.3368000090122223 | 0.3399679958820343 | 0.34191998839378357 | 5 | 90.62 | flash-attn3 | hf-kernels |
-| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L320 | 1 | 1344 | 24 | 128 | bfloat16 | 0.36019839644432067 | 0.3563520014286041 | 0.3604480028152466 | 0.36137598752975464 | 5 | 95.06 | flash-attn3 | hf-kernels |
-| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L384 | 1 | 1408 | 24 | 128 | bfloat16 | 0.37342079877853396 | 0.3718400001525879 | 0.37379199266433716 | 0.3746879994869232 | 5 | 99.88 | flash-attn3 | hf-kernels |
-| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L448 | 1 | 1472 | 24 | 128 | bfloat16 | 0.4024448037147522 | 0.3993600010871887 | 0.4014720022678375 | 0.4034560024738312 | 5 | 103.81 | flash-attn3 | hf-kernels |
-| HF Kernels Flash Attn3 | hf_kernels_flash_attn3 | flux_L512 | 1 | 1536 | 24 | 128 | bfloat16 | 0.4305088043212891 | 0.4270080029964447 | 0.4291520118713379 | 0.4331519901752472 | 5 | 109.12 | flash-attn3 | hf-kernels |
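A closing note on the helper this diff leans on: judging from the inline implementation it deletes, create_svg_with_tagging presumably monkey-patches plt.savefig so that any save, including ones issued inside tools.viz, is forced to SVG at a stable artifact path with CSS-targetable ids, and it hands the originals back for the finally-block restore. A rough sketch of that contract, reconstructed from the removed code rather than from the library source:

from pathlib import Path
import matplotlib.pyplot as plt

def create_svg_with_tagging(out_name: str, hashsalt: str):
    # Sketch only: the real helper lives in kernels_benchmark_tools.core.visuals.
    # The id/class tagging done by the removed _tag_current_figure and
    # _postprocess_svg_add_classes is elided here; hashsalt presumably seeds
    # svg.hashsalt for deterministic ids (see the removed rcParams block).
    out = Path(out_name)
    orig_savefig, orig_close = plt.savefig, plt.close

    def patched_savefig(fname, *args, **kwargs):
        kwargs["format"] = "svg"  # ignore fname: always write SVG to the stable path
        res = orig_savefig(out, *args, **kwargs)
        print(f"✓ Visualization saved as {out}")
        return res

    plt.savefig = patched_savefig
    return orig_savefig, orig_close  # caller restores both in its finally block

The restore in the script's finally block mirrors the cleanup the old inline version performed, so later cells see an unpatched matplotlib either way.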