riazmo committed on
Commit
17a7a81
·
verified ·
1 Parent(s): ba25cd5

Delete app.py

Browse files
Files changed (1) hide show
  1. app.py +0 -395
app.py DELETED
@@ -1,395 +0,0 @@
1
- """
2
- Design System Extractor v2 — Main Application
3
- ==============================================
4
-
5
- A semi-automated, human-in-the-loop agentic system that reverse-engineers
6
- design systems from live websites.
7
-
8
- Usage:
9
- python app.py
10
-
11
- Or for development:
12
- gradio app.py
13
- """
14
-
15
- import asyncio
16
- import gradio as gr
17
- from datetime import datetime
18
-
19
- from agents.graph import WorkflowRunner, create_workflow
20
- from agents.crawler import PageDiscoverer, discover_pages
21
- from agents.extractor import TokenExtractor
22
- from core.token_schema import Viewport, DiscoveredPage
23
- from config.settings import get_settings, is_debug
24
-
25
-
26
- # =============================================================================
27
- # GLOBAL STATE
28
- # =============================================================================
29
-
30
# LangGraph workflow runner handle.
# NOTE(review): never assigned or read elsewhere in this file — looks vestigial; confirm.
workflow_runner: WorkflowRunner | None = None

# Mutable per-session store shared by the UI handlers below. Holds
# "discovered_pages", "base_url", and per-viewport extraction results under
# the keys "desktop_tokens" / "mobile_tokens".
current_extraction: dict = {}
32
-
33
-
34
- # =============================================================================
35
- # STAGE 1: URL INPUT & PAGE DISCOVERY
36
- # =============================================================================
37
-
38
async def discover_site_pages(url: str, progress=gr.Progress()) -> tuple:
    """
    Crawl a website and list its pages for the user to review.

    Returns a tuple of (status_message, pages_dataframe, pages_json);
    the last two are None when validation fails or the crawl errors out.
    """
    # Guard clause: require an absolute http(s) URL before starting a browser.
    if not url or not url.startswith(("http://", "https://")):
        return "Please enter a valid URL starting with http:// or https://", None, None

    progress(0, desc="Initializing browser...")

    try:
        finder = PageDiscoverer()

        def report(p):
            progress(p, desc=f"Discovering pages... ({int(p*100)}%)")

        pages = await finder.discover(url, progress_callback=report)

        # One row per discovered page, shaped for the Gradio dataframe widget.
        table_rows = [
            {
                "Select": page.selected,
                "URL": page.url,
                "Title": page.title or "(No title)",
                "Type": page.page_type.value,
                "Status": "✓" if not page.error else f"⚠ {page.error}",
            }
            for page in pages
        ]

        # Stash results in the session store so the extraction stage can reuse them.
        current_extraction["base_url"] = url
        current_extraction["discovered_pages"] = pages

        status = f"✓ Found {len(pages)} pages. Select the pages you want to extract tokens from."

        return status, table_rows, [p.model_dump() for p in pages]

    except Exception as e:
        return f"❌ Error: {str(e)}", None, None
78
-
79
-
80
async def start_extraction(pages_selection: list, viewport_choice: str, progress=gr.Progress()) -> tuple:
    """
    Start token extraction from selected pages.

    Returns tuple of (status, colors_data, typography_data, spacing_data);
    the last three are None on validation failure or extraction error.
    """
    if not pages_selection:
        return "Please select at least one page", None, None, None

    # Get selected URLs
    # NOTE(review): assumes each row is a dict with "Select"/"URL" keys — the
    # actual row shape depends on the gr.Dataframe configuration; confirm.
    selected_urls = []
    for row in pages_selection:
        if row.get("Select", False):
            selected_urls.append(row["URL"])

    if not selected_urls:
        return "Please select at least one page using the checkboxes", None, None, None

    # Determine viewport (anything other than the desktop label falls back to mobile)
    viewport = Viewport.DESKTOP if viewport_choice == "Desktop (1440px)" else Viewport.MOBILE

    progress(0, desc=f"Starting {viewport.value} extraction...")

    try:
        extractor = TokenExtractor(viewport=viewport)

        def update_progress(p):
            progress(p, desc=f"Extracting tokens... ({int(p*100)}%)")

        result = await extractor.extract(selected_urls, progress_callback=update_progress)

        # Store result per viewport ("desktop_tokens"/"mobile_tokens") for the export stage
        current_extraction[f"{viewport.value}_tokens"] = result

        # Format colors for display — most frequent first, capped at 50 rows
        colors_data = []
        for color in sorted(result.colors, key=lambda c: -c.frequency)[:50]:
            colors_data.append({
                "Accept": True,
                "Color": color.value,
                "Frequency": color.frequency,
                "Context": ", ".join(color.contexts[:3]),
                "Contrast (White)": f"{color.contrast_white}:1",
                "AA Text": "✓" if color.wcag_aa_small_text else "✗",
                "Confidence": color.confidence.value,
            })

        # Format typography for display — most frequent first, capped at 30 rows
        typography_data = []
        for typo in sorted(result.typography, key=lambda t: -t.frequency)[:30]:
            typography_data.append({
                "Accept": True,
                "Font": typo.font_family,
                "Size": typo.font_size,
                "Weight": typo.font_weight,
                "Line Height": typo.line_height,
                "Elements": ", ".join(typo.elements[:3]),
                "Frequency": typo.frequency,
            })

        # Format spacing for display — smallest value first, capped at 20 rows
        spacing_data = []
        for space in sorted(result.spacing, key=lambda s: s.value_px)[:20]:
            spacing_data.append({
                "Accept": True,
                "Value": space.value,
                "Frequency": space.frequency,
                "Context": ", ".join(space.contexts[:2]),
                "Fits 8px": "✓" if space.fits_base_8 else "",
                "Outlier": "⚠" if space.is_outlier else "",
            })

        # Summary (rendered as Markdown in the status widget)
        status = f"""✓ Extraction Complete ({viewport.value})

**Summary:**
- Pages crawled: {len(result.pages_crawled)}
- Colors found: {len(result.colors)}
- Typography styles: {len(result.typography)}
- Spacing values: {len(result.spacing)}
- Font families: {len(result.font_families)}
- Detected spacing base: {result.spacing_base or 'Unknown'}px
- Duration: {result.extraction_duration_ms}ms

{f'⚠ Warnings: {len(result.warnings)}' if result.warnings else ''}
{f'❌ Errors: {len(result.errors)}' if result.errors else ''}
"""

        return status, colors_data, typography_data, spacing_data

    except Exception as e:
        return f"❌ Extraction failed: {str(e)}", None, None, None
172
-
173
-
174
- def export_tokens_json():
175
- """Export current tokens to JSON."""
176
- import json
177
-
178
- result = {}
179
-
180
- if "desktop_tokens" in current_extraction:
181
- desktop = current_extraction["desktop_tokens"]
182
- result["desktop"] = {
183
- "colors": [c.model_dump() for c in desktop.colors],
184
- "typography": [t.model_dump() for t in desktop.typography],
185
- "spacing": [s.model_dump() for s in desktop.spacing],
186
- "metadata": desktop.summary(),
187
- }
188
-
189
- if "mobile_tokens" in current_extraction:
190
- mobile = current_extraction["mobile_tokens"]
191
- result["mobile"] = {
192
- "colors": [c.model_dump() for c in mobile.colors],
193
- "typography": [t.model_dump() for t in mobile.typography],
194
- "spacing": [s.model_dump() for s in mobile.spacing],
195
- "metadata": mobile.summary(),
196
- }
197
-
198
- return json.dumps(result, indent=2, default=str)
199
-
200
-
201
- # =============================================================================
202
- # UI BUILDING
203
- # =============================================================================
204
-
205
def create_ui():
    """Create the Gradio interface.

    Builds a three-stage accordion layout (discovery → extraction → export)
    and wires the button click handlers defined above. Returns the
    gr.Blocks app, ready for .launch().
    """

    # NOTE(review): `settings` is not referenced anywhere below — looks vestigial; confirm.
    settings = get_settings()

    with gr.Blocks(
        title="Design System Extractor v2",
        theme=gr.themes.Soft(),
        css="""
        .token-preview { padding: 10px; border-radius: 8px; }
        .color-swatch { width: 40px; height: 40px; border-radius: 4px; display: inline-block; }
        """
    ) as app:

        # Header
        gr.Markdown("""
        # 🎨 Design System Extractor v2

        **Reverse-engineer design systems from live websites.**

        This tool crawls your website, extracts design tokens (colors, typography, spacing),
        and helps you rebuild a structured design system.

        ---
        """)

        # =================================================================
        # STAGE 1: URL Input & Discovery
        # =================================================================

        with gr.Accordion("📍 Stage 1: Website Discovery", open=True):

            gr.Markdown("""
            **Step 1:** Enter your website URL and discover pages.
            The system will automatically find and classify pages for extraction.
            """)

            with gr.Row():
                url_input = gr.Textbox(
                    label="Website URL",
                    placeholder="https://example.com",
                    scale=4,
                )
                discover_btn = gr.Button("🔍 Discover Pages", variant="primary", scale=1)

            discovery_status = gr.Markdown("")

            # Hidden until discovery succeeds (revealed by the .then() handler below).
            pages_table = gr.Dataframe(
                headers=["Select", "URL", "Title", "Type", "Status"],
                datatype=["bool", "str", "str", "str", "str"],
                interactive=True,
                label="Discovered Pages",
                visible=False,
            )

            pages_json = gr.JSON(visible=False)  # Hidden storage

        # =================================================================
        # STAGE 2: Extraction
        # =================================================================

        # NOTE(review): `extraction_accordion` is captured but never used —
        # possibly intended to auto-open after discovery; confirm.
        with gr.Accordion("🔬 Stage 2: Token Extraction", open=False) as extraction_accordion:

            gr.Markdown("""
            **Step 2:** Select pages and viewport, then extract design tokens.
            """)

            with gr.Row():
                viewport_radio = gr.Radio(
                    choices=["Desktop (1440px)", "Mobile (375px)"],
                    value="Desktop (1440px)",
                    label="Viewport",
                )
                extract_btn = gr.Button("🚀 Extract Tokens", variant="primary")

            extraction_status = gr.Markdown("")

            with gr.Tabs():
                with gr.Tab("🎨 Colors"):
                    colors_table = gr.Dataframe(
                        headers=["Accept", "Color", "Frequency", "Context", "Contrast (White)", "AA Text", "Confidence"],
                        datatype=["bool", "str", "number", "str", "str", "str", "str"],
                        interactive=True,
                        label="Extracted Colors",
                    )

                with gr.Tab("📝 Typography"):
                    typography_table = gr.Dataframe(
                        headers=["Accept", "Font", "Size", "Weight", "Line Height", "Elements", "Frequency"],
                        datatype=["bool", "str", "str", "number", "str", "str", "number"],
                        interactive=True,
                        label="Extracted Typography",
                    )

                with gr.Tab("📏 Spacing"):
                    spacing_table = gr.Dataframe(
                        headers=["Accept", "Value", "Frequency", "Context", "Fits 8px", "Outlier"],
                        datatype=["bool", "str", "number", "str", "str", "str"],
                        interactive=True,
                        label="Extracted Spacing",
                    )

        # =================================================================
        # STAGE 3: Export
        # =================================================================

        with gr.Accordion("📦 Stage 3: Export", open=False):

            gr.Markdown("""
            **Step 3:** Review and export your design tokens.
            """)

            with gr.Row():
                export_btn = gr.Button("📥 Export JSON", variant="secondary")

            export_output = gr.Code(
                label="Exported Tokens (JSON)",
                language="json",
                lines=20,
            )

        # =================================================================
        # EVENT HANDLERS
        # =================================================================

        # Discovery: run the crawl, then reveal the (initially hidden) pages table.
        discover_btn.click(
            fn=discover_site_pages,
            inputs=[url_input],
            outputs=[discovery_status, pages_table, pages_json],
        ).then(
            fn=lambda: gr.update(visible=True),
            outputs=[pages_table],
        )

        # Extraction: the edited dataframe (with Select checkboxes) feeds the extractor.
        extract_btn.click(
            fn=start_extraction,
            inputs=[pages_table, viewport_radio],
            outputs=[extraction_status, colors_table, typography_table, spacing_table],
        )

        # Export: no inputs — export_tokens_json reads the module-level session store.
        export_btn.click(
            fn=export_tokens_json,
            outputs=[export_output],
        )

        # =================================================================
        # FOOTER
        # =================================================================

        gr.Markdown("""
        ---

        **Design System Extractor v2** | Built with LangGraph + Gradio

        *A semi-automated co-pilot for design system recovery and modernization.*
        """)

    return app
366
-
367
-
368
- # =============================================================================
369
- # MAIN
370
- # =============================================================================
371
-
372
def main():
    """Validate configuration, build the UI, and launch the Gradio server."""
    settings = get_settings()

    # Refuse to start on configuration errors unless DEBUG overrides the check.
    problems = settings.validate()
    if problems and not is_debug():
        print("Configuration errors:")
        for problem in problems:
            print(f"  - {problem}")
        print("\nSet DEBUG=true to continue anyway.")
        return

    # Build and launch the app with the configured server options.
    ui_settings = settings.ui
    create_ui().launch(
        server_port=ui_settings.server_port,
        share=ui_settings.share,
        debug=settings.debug,
    )
392
-
393
-
394
# Script entry point: `python app.py` launches the UI directly.
if __name__ == "__main__":
    main()